npm - @chllming/wave-orchestration - Versions diffs - 0.6.2 → 0.7.0 - Mend

@chllming/wave-orchestration 0.6.2 → 0.7.0

This diff compares the contents of two publicly available versions of this package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in the public registry.

Files changed (116)

package/CHANGELOG.md +64 -1
package/README.md +44 -8
package/docs/agents/wave-orchestrator-role.md +50 -0
package/docs/agents/wave-planner-role.md +39 -0
package/docs/context7/bundles.json +9 -0
package/docs/context7/planner-agent/README.md +25 -0
package/docs/context7/planner-agent/manifest.json +83 -0
package/docs/context7/planner-agent/papers/cooperbench-why-coding-agents-cannot-be-your-teammates-yet.md +3283 -0
package/docs/context7/planner-agent/papers/dova-deliberation-first-multi-agent-orchestration-for-autonomous-research-automation.md +1699 -0
package/docs/context7/planner-agent/papers/dpbench-large-language-models-struggle-with-simultaneous-coordination.md +2251 -0
package/docs/context7/planner-agent/papers/incremental-planning-to-control-a-blackboard-based-problem-solver.md +1729 -0
package/docs/context7/planner-agent/papers/silo-bench-a-scalable-environment-for-evaluating-distributed-coordination-in-multi-agent-llm-systems.md +3747 -0
package/docs/context7/planner-agent/papers/todoevolve-learning-to-architect-agent-planning-systems.md +1675 -0
package/docs/context7/planner-agent/papers/verified-multi-agent-orchestration-a-plan-execute-verify-replan-framework-for-complex-query-resolution.md +1173 -0
package/docs/context7/planner-agent/papers/why-do-multi-agent-llm-systems-fail.md +5211 -0
package/docs/context7/planner-agent/topics/planning-and-orchestration.md +24 -0
package/docs/evals/README.md +96 -1
package/docs/evals/arm-templates/README.md +13 -0
package/docs/evals/arm-templates/full-wave.json +15 -0
package/docs/evals/arm-templates/single-agent.json +15 -0
package/docs/evals/benchmark-catalog.json +7 -0
package/docs/evals/cases/README.md +47 -0
package/docs/evals/cases/wave-blackboard-inbox-targeting.json +73 -0
package/docs/evals/cases/wave-contradiction-conflict.json +104 -0
package/docs/evals/cases/wave-expert-routing-preservation.json +69 -0
package/docs/evals/cases/wave-hidden-profile-private-evidence.json +81 -0
package/docs/evals/cases/wave-premature-closure-guard.json +71 -0
package/docs/evals/cases/wave-silo-cross-agent-state.json +77 -0
package/docs/evals/cases/wave-simultaneous-lockstep.json +92 -0
package/docs/evals/cooperbench/real-world-mitigation.md +341 -0
package/docs/evals/external-benchmarks.json +85 -0
package/docs/evals/external-command-config.sample.json +9 -0
package/docs/evals/external-command-config.swe-bench-pro.json +8 -0
package/docs/evals/pilots/README.md +47 -0
package/docs/evals/pilots/swe-bench-pro-public-full-wave-review-10.json +64 -0
package/docs/evals/pilots/swe-bench-pro-public-pilot.json +111 -0
package/docs/evals/wave-benchmark-program.md +302 -0
package/docs/guides/planner.md +48 -11
package/docs/plans/context7-wave-orchestrator.md +20 -0
package/docs/plans/current-state.md +9 -1
package/docs/plans/examples/wave-benchmark-improvement.md +108 -0
package/docs/plans/examples/wave-example-live-proof.md +1 -1
package/docs/plans/examples/wave-example-rollout-fidelity.md +340 -0
package/docs/plans/wave-orchestrator.md +73 -11
package/docs/plans/waves/reviews/wave-1-benchmark-operator.md +118 -0
package/docs/reference/coordination-and-closure.md +436 -0
package/docs/reference/live-proof-waves.md +25 -3
package/docs/reference/npmjs-trusted-publishing.md +3 -3
package/docs/reference/proof-metrics.md +90 -0
package/docs/reference/runtime-config/README.md +61 -0
package/docs/reference/sample-waves.md +29 -18
package/docs/reference/wave-control.md +164 -0
package/docs/reference/wave-planning-lessons.md +131 -0
package/package.json +5 -4
package/releases/manifest.json +33 -0
package/scripts/research/agent-context-archive.mjs +18 -0
package/scripts/research/manifests/agent-context-expanded-2026-03-22.mjs +17 -0
package/scripts/research/sync-planner-context7-bundle.mjs +133 -0
package/scripts/wave-autonomous.mjs +2 -4
package/scripts/wave-orchestrator/adhoc.mjs +32 -11
package/scripts/wave-orchestrator/artifact-schemas.mjs +232 -0
package/scripts/wave-orchestrator/autonomous.mjs +27 -6
package/scripts/wave-orchestrator/benchmark-cases.mjs +374 -0
package/scripts/wave-orchestrator/benchmark-external.mjs +1384 -0
package/scripts/wave-orchestrator/benchmark.mjs +972 -0
package/scripts/wave-orchestrator/clarification-triage.mjs +78 -12
package/scripts/wave-orchestrator/config.mjs +175 -0
package/scripts/wave-orchestrator/control-cli.mjs +1123 -0
package/scripts/wave-orchestrator/control-plane.mjs +697 -0
package/scripts/wave-orchestrator/coord-cli.mjs +360 -2
package/scripts/wave-orchestrator/coordination-store.mjs +211 -9
package/scripts/wave-orchestrator/coordination.mjs +84 -0
package/scripts/wave-orchestrator/dashboard-renderer.mjs +38 -3
package/scripts/wave-orchestrator/dashboard-state.mjs +22 -0
package/scripts/wave-orchestrator/evals.mjs +23 -0
package/scripts/wave-orchestrator/executors.mjs +3 -2
package/scripts/wave-orchestrator/feedback.mjs +55 -0
package/scripts/wave-orchestrator/install.mjs +253 -26
package/scripts/wave-orchestrator/launcher-closure.mjs +4 -1
package/scripts/wave-orchestrator/launcher-runtime.mjs +24 -21
package/scripts/wave-orchestrator/launcher.mjs +800 -35
package/scripts/wave-orchestrator/package-update-notice.mjs +230 -0
package/scripts/wave-orchestrator/package-version.mjs +32 -0
package/scripts/wave-orchestrator/planner-context.mjs +75 -0
package/scripts/wave-orchestrator/planner.mjs +2270 -136
package/scripts/wave-orchestrator/proof-cli.mjs +195 -0
package/scripts/wave-orchestrator/proof-registry.mjs +317 -0
package/scripts/wave-orchestrator/replay.mjs +10 -4
package/scripts/wave-orchestrator/retry-cli.mjs +184 -0
package/scripts/wave-orchestrator/retry-control.mjs +225 -0
package/scripts/wave-orchestrator/shared.mjs +26 -0
package/scripts/wave-orchestrator/swe-bench-pro-task.mjs +1004 -0
package/scripts/wave-orchestrator/traces.mjs +157 -2
package/scripts/wave-orchestrator/wave-control-client.mjs +532 -0
package/scripts/wave-orchestrator/wave-control-schema.mjs +309 -0
package/scripts/wave-orchestrator/wave-files.mjs +17 -5
package/scripts/wave.mjs +39 -2
package/skills/repo-coding-rules/SKILL.md +1 -0
package/skills/role-cont-eval/SKILL.md +1 -0
package/skills/role-cont-qa/SKILL.md +13 -6
package/skills/role-deploy/SKILL.md +1 -0
package/skills/role-documentation/SKILL.md +4 -0
package/skills/role-implementation/SKILL.md +4 -0
package/skills/role-infra/SKILL.md +2 -1
package/skills/role-integration/SKILL.md +15 -8
package/skills/role-planner/SKILL.md +39 -0
package/skills/role-planner/skill.json +21 -0
package/skills/role-research/SKILL.md +1 -0
package/skills/role-security/SKILL.md +2 -2
package/skills/runtime-claude/SKILL.md +2 -1
package/skills/runtime-codex/SKILL.md +1 -0
package/skills/runtime-local/SKILL.md +2 -0
package/skills/runtime-opencode/SKILL.md +1 -0
package/skills/wave-core/SKILL.md +25 -6
package/skills/wave-core/references/marker-syntax.md +16 -8
package/wave.config.json +45 -0

package/scripts/wave-orchestrator/coordination-store.mjs CHANGED Viewed

@@ -2,7 +2,10 @@ import crypto from "node:crypto";
 import fs from "node:fs";
 import path from "node:path";
 import {
+  DEFAULT_COORDINATION_ACK_TIMEOUT_MS,
+  DEFAULT_COORDINATION_RESOLUTION_STALE_MS,
   REPO_ROOT,
+  buildLanePaths,
   compactSingleLine,
   ensureDirectory,
   readJsonOrNull,
@@ -10,6 +13,7 @@ import {
   truncate,
   writeTextAtomic,
 } from "./shared.mjs";
+import { safeQueueWaveControlEvent } from "./wave-control-client.mjs";
 export const COORDINATION_KIND_VALUES = [
   "request",
@@ -147,6 +151,50 @@ export function appendCoordinationRecord(filePath, rawRecord, defaults = {}) {
   const record = normalizeCoordinationRecord(rawRecord, defaults);
   ensureDirectory(path.dirname(filePath));
   fs.appendFileSync(filePath, `${JSON.stringify(record)}\n`, "utf8");
+  const runIdHint = normalizeString(rawRecord?.runId ?? defaults.runId, "");
+  try {
+    const lanePaths = buildLanePaths(record.lane, {
+      ...(runIdHint ? { adhocRunId: runIdHint } : {}),
+    });
+    if (lanePaths?.waveControl?.captureCoordinationRecords !== false) {
+      safeQueueWaveControlEvent(lanePaths, {
+        category: "coordination",
+        entityType: "coordination_record",
+        entityId: record.id,
+        action: "recorded",
+        source: record.source,
+        actor: record.agentId,
+        recordedAt: record.updatedAt || record.createdAt,
+        identity: {
+          lane: record.lane,
+          wave: record.wave,
+          attempt: record.attempt,
+          agentId: record.agentId,
+          runKind: lanePaths.runKind,
+          runId: lanePaths.runId,
+        },
+        tags: [`kind:${record.kind}`, `status:${record.status}`],
+        data: {
+          kind: record.kind,
+          status: record.status,
+          priority: record.priority,
+          confidence: record.confidence,
+          summary: record.summary,
+          detail: record.detail,
+          targets: record.targets,
+          artifactRefs: record.artifactRefs,
+          dependsOn: record.dependsOn,
+          closureCondition: record.closureCondition,
+          required: record.required,
+          executorId: record.executorId || null,
+          requesterLane: record.requesterLane || null,
+          ownerLane: record.ownerLane || null,
+        },
+      });
+    }
+  } catch {
+    // Telemetry is best-effort and must never block canonical coordination writes.
+  }
   return record;
 }
@@ -311,11 +359,137 @@ export function serializeCoordinationState(state) {
   };
 }
-function renderOpenRecord(record) {
+function parseRecordStartMs(record) {
+  const createdAtMs = Date.parse(record?.createdAt || "");
+  if (Number.isFinite(createdAtMs)) {
+    return createdAtMs;
+  }
+  const updatedAtMs = Date.parse(record?.updatedAt || "");
+  return Number.isFinite(updatedAtMs) ? updatedAtMs : null;
+}
+function formatAgeMs(ageMs) {
+  if (!Number.isFinite(ageMs)) {
+    return "n/a";
+  }
+  const totalSeconds = Math.max(0, Math.floor(ageMs / 1000));
+  if (totalSeconds < 60) {
+    return `${totalSeconds}s`;
+  }
+  const minutes = Math.floor(totalSeconds / 60);
+  if (minutes < 60) {
+    return `${minutes}m`;
+  }
+  const hours = Math.floor(minutes / 60);
+  return `${hours}h ${minutes % 60}m`;
+}
+function isAckTrackedRecord(record) {
+  if (!record || typeof record !== "object") {
+    return false;
+  }
+  if (["clarification-request", "human-feedback", "human-escalation"].includes(record.kind)) {
+    return true;
+  }
+  if (record.kind !== "request") {
+    return false;
+  }
+  return record.source !== "launcher" || isClarificationLinkedRequest(record);
+}
+export function buildCoordinationResponseMetrics(state, options = {}) {
+  const nowMs = Number.isFinite(options.nowMs) ? options.nowMs : Date.now();
+  const ackTimeoutMs = Number.isFinite(options.ackTimeoutMs)
+    ? options.ackTimeoutMs
+    : DEFAULT_COORDINATION_ACK_TIMEOUT_MS;
+  const resolutionStaleMs = Number.isFinite(options.resolutionStaleMs)
+    ? options.resolutionStaleMs
+    : DEFAULT_COORDINATION_RESOLUTION_STALE_MS;
+  const recordMetricsById = new Map();
+  const overdueAckRecordIds = [];
+  const overdueClarificationIds = new Set();
+  let oldestOpenCoordinationAgeMs = null;
+  let oldestUnackedRequestAgeMs = null;
+  for (const record of state?.openRecords || []) {
+    const startMs = parseRecordStartMs(record);
+    const ageMs = Number.isFinite(startMs) ? Math.max(0, nowMs - startMs) : null;
+    const ackTracked = isAckTrackedRecord(record);
+    const ackPending = ackTracked && record.status === "open";
+    const clarificationLinked =
+      record.kind === "clarification-request" || isClarificationLinkedRequest(record);
+    const overdueAck = ackPending && Number.isFinite(ageMs) && ageMs >= ackTimeoutMs;
+    const staleClarification =
+      clarificationLinked && Number.isFinite(ageMs) && ageMs >= resolutionStaleMs;
+    if (Number.isFinite(ageMs)) {
+      oldestOpenCoordinationAgeMs =
+        oldestOpenCoordinationAgeMs === null
+          ? ageMs
+          : Math.max(oldestOpenCoordinationAgeMs, ageMs);
+      if (ackPending) {
+        oldestUnackedRequestAgeMs =
+          oldestUnackedRequestAgeMs === null
+            ? ageMs
+            : Math.max(oldestUnackedRequestAgeMs, ageMs);
+      }
+    }
+    if (overdueAck) {
+      overdueAckRecordIds.push(record.id);
+    }
+    if (staleClarification) {
+      overdueClarificationIds.add(
+        record.kind === "clarification-request"
+          ? record.id
+          : clarificationIdFromClosureCondition(record.closureCondition) || record.id,
+      );
+    }
+    recordMetricsById.set(record.id, {
+      ageMs,
+      ageLabel: formatAgeMs(ageMs),
+      ackTracked,
+      ackPending,
+      overdueAck,
+      clarificationLinked,
+      staleClarification,
+    });
+  }
+  return {
+    ackTimeoutMs,
+    resolutionStaleMs,
+    oldestOpenCoordinationAgeMs,
+    oldestUnackedRequestAgeMs,
+    overdueAckCount: overdueAckRecordIds.length,
+    overdueClarificationCount: overdueClarificationIds.size,
+    overdueAckRecordIds: overdueAckRecordIds.toSorted((a, b) => a.localeCompare(b)),
+    overdueClarificationIds: Array.from(overdueClarificationIds).toSorted((a, b) =>
+      a.localeCompare(b),
+    ),
+    openHumanEscalationCount: (state?.humanEscalations || []).filter((record) =>
+      isOpenCoordinationStatus(record.status),
+    ).length,
+    recordMetricsById,
+  };
+}
+function renderOpenRecord(record, responseMetrics = null) {
   const targets = record.targets.length > 0 ? ` -> ${record.targets.join(", ")}` : "";
   const artifacts =
     record.artifactRefs.length > 0 ? ` [artifacts: ${record.artifactRefs.join(", ")}]` : "";
-  return `- [${record.priority}] ${record.kind}/${record.status} ${record.agentId}${targets}: ${compactSingleLine(record.summary || record.detail || "no summary", 160)}${artifacts}`;
+  const recordMetrics = responseMetrics?.recordMetricsById?.get?.(record.id) || null;
+  const tags = [];
+  if (recordMetrics?.ageLabel && recordMetrics.ageLabel !== "n/a") {
+    tags.push(`age=${recordMetrics.ageLabel}`);
+  }
+  if (recordMetrics?.overdueAck) {
+    tags.push("overdue-ack");
+  }
+  if (recordMetrics?.staleClarification) {
+    tags.push("stale-clarification");
+  }
+  const timing = tags.length > 0 ? ` [${tags.join(", ")}]` : "";
+  return `- [${record.priority}] ${record.kind}/${record.status} ${record.agentId}${targets}${timing} id=${record.id}: ${compactSingleLine(record.summary || record.detail || "no summary", 160)}${artifacts}`;
 }
 function renderActivityRecord(record) {
@@ -345,6 +519,7 @@ export function renderCoordinationBoardProjection({
   state,
   capabilityAssignments = [],
   dependencySnapshot = null,
+  timingOptions = null,
 }) {
   const latestRecords = Array.isArray(state?.latestRecords) ? state.latestRecords : [];
   const openRecords = latestRecords.filter((record) => OPEN_COORDINATION_STATUSES.has(record.status));
@@ -352,16 +527,29 @@ export function renderCoordinationBoardProjection({
   const openAssignments = (capabilityAssignments || []).filter((assignment) => assignment.blocking);
   const openInboundDependencies = dependencySnapshot?.openInbound || [];
   const openOutboundDependencies = dependencySnapshot?.openOutbound || [];
+  const responseMetrics = buildCoordinationResponseMetrics(state, timingOptions || {});
+  const oldestOpenAge =
+    responseMetrics.oldestOpenCoordinationAgeMs === null
+      ? "none"
+      : formatAgeMs(responseMetrics.oldestOpenCoordinationAgeMs);
+  const oldestUnackedAge =
+    responseMetrics.oldestUnackedRequestAgeMs === null
+      ? "none"
+      : formatAgeMs(responseMetrics.oldestUnackedRequestAgeMs);
   return [
     `# Wave ${wave} Message Board`,
     "",
     `- Wave file: \`${waveFile}\``,
     `- Agents: ${(agents || []).map((agent) => agent.agentId).join(", ")}`,
     `- Generated: ${toIsoTimestamp()}`,
+    `- Oldest open coordination age: ${oldestOpenAge}`,
+    `- Oldest unacknowledged request age: ${oldestUnackedAge}`,
+    `- Overdue acknowledgements: ${responseMetrics.overdueAckCount}`,
+    `- Overdue clarification chains: ${responseMetrics.overdueClarificationCount}`,
     "",
     "## Open Coordination State",
     ...(openRecords.length > 0
-      ? openRecords.map((record) => renderOpenRecord(record))
+      ? openRecords.map((record) => renderOpenRecord(record, responseMetrics))
       : ["- None."]),
     "",
     "## Helper Assignments",
@@ -457,6 +645,7 @@ export function compileSharedSummary({
   capabilityAssignments = [],
   dependencySnapshot = null,
   maxChars = 4000,
+  timingOptions = null,
 }) {
   const openBlockers = state.blockers.filter((record) => OPEN_COORDINATION_STATUSES.has(record.status));
   const openRequests = state.requests.filter((record) => OPEN_COORDINATION_STATUSES.has(record.status));
@@ -469,6 +658,7 @@ export function compileSharedSummary({
   const openHelperAssignments = (capabilityAssignments || []).filter((assignment) => assignment.blocking);
   const openInboundDependencies = dependencySnapshot?.openInbound || [];
   const openOutboundDependencies = dependencySnapshot?.openOutbound || [];
+  const responseMetrics = buildCoordinationResponseMetrics(state, timingOptions || {});
   const summary = [
     `# Wave ${wave.wave} Shared Summary`,
     "",
@@ -480,6 +670,10 @@ export function compileSharedSummary({
     `- Open helper assignments: ${openHelperAssignments.length}`,
     `- Open inbound dependencies: ${openInboundDependencies.length}`,
     `- Open outbound dependencies: ${openOutboundDependencies.length}`,
+    `- Oldest open coordination age: ${responseMetrics.oldestOpenCoordinationAgeMs === null ? "none" : formatAgeMs(responseMetrics.oldestOpenCoordinationAgeMs)}`,
+    `- Oldest unacknowledged request age: ${responseMetrics.oldestUnackedRequestAgeMs === null ? "none" : formatAgeMs(responseMetrics.oldestUnackedRequestAgeMs)}`,
+    `- Overdue acknowledgements: ${responseMetrics.overdueAckCount}`,
+    `- Overdue clarification chains: ${responseMetrics.overdueClarificationCount}`,
     ...(integrationSummary
       ? [`- Integration recommendation: ${integrationSummary.recommendation || "n/a"}`]
       : []),
@@ -498,12 +692,12 @@ export function compileSharedSummary({
     "",
     "## Current blockers",
     ...(openBlockers.length > 0
-      ? openBlockers.map((record) => renderOpenRecord(record))
+      ? openBlockers.map((record) => renderOpenRecord(record, responseMetrics))
       : ["- None."]),
     "",
     "## Current clarifications",
     ...(openClarifications.length > 0
-      ? openClarifications.map((record) => renderOpenRecord(record))
+      ? openClarifications.map((record) => renderOpenRecord(record, responseMetrics))
       : ["- None."]),
     "",
     "## Helper assignments",
@@ -588,6 +782,7 @@ export function compileAgentInbox({
   capabilityAssignments = [],
   dependencySnapshot = null,
   maxChars = 8000,
+  timingOptions = null,
 }) {
   const targetedRecords = state.openRecords.filter((record) => isTargetedToAgent(record, agent));
   const ownedRecords = (state.recordsByAgentId.get(agent.agentId) || []).filter((record) =>
@@ -624,6 +819,7 @@ export function compileAgentInbox({
   const helperAssignments = (capabilityAssignments || []).filter(
     (assignment) => assignment.blocking && assignment.assignedAgentId === agent.agentId,
   );
+  const responseMetrics = buildCoordinationResponseMetrics(state, timingOptions || {});
   const dependencyItems = [
     ...((dependencySnapshot?.inbound || []).filter(
       (record) =>
@@ -641,24 +837,30 @@ export function compileAgentInbox({
   const text = [
     `# Wave ${wave.wave} Inbox for ${agent.agentId}`,
     "",
+    "## Response timing",
+    `- Oldest open coordination age: ${responseMetrics.oldestOpenCoordinationAgeMs === null ? "none" : formatAgeMs(responseMetrics.oldestOpenCoordinationAgeMs)}`,
+    `- Oldest unacknowledged request age: ${responseMetrics.oldestUnackedRequestAgeMs === null ? "none" : formatAgeMs(responseMetrics.oldestUnackedRequestAgeMs)}`,
+    `- Overdue acknowledgements: ${responseMetrics.overdueAckCount}`,
+    `- Overdue clarification chains: ${responseMetrics.overdueClarificationCount}`,
+    "",
     "## Targeted open coordination",
     ...(targetedRecords.length > 0
-      ? targetedRecords.map((record) => renderOpenRecord(record))
+      ? targetedRecords.map((record) => renderOpenRecord(record, responseMetrics))
       : ["- None."]),
     "",
     "## Your open coordination items",
     ...(ownedRecords.length > 0
-      ? ownedRecords.map((record) => renderOpenRecord(record))
+      ? ownedRecords.map((record) => renderOpenRecord(record, responseMetrics))
       : ["- None."]),
     "",
     "## Clarifications",
     ...(clarificationRecords.length > 0
-      ? clarificationRecords.map((record) => renderOpenRecord(record))
+      ? clarificationRecords.map((record) => renderOpenRecord(record, responseMetrics))
       : ["- None."]),
     "",
     "## Relevant open coordination",
     ...(relevantRecords.length > 0
-      ? relevantRecords.map((record) => renderOpenRecord(record))
+      ? relevantRecords.map((record) => renderOpenRecord(record, responseMetrics))
       : ["- None."]),
     "",
     "## Helper assignments",

package/scripts/wave-orchestrator/coordination.mjs CHANGED Viewed

@@ -455,6 +455,7 @@ export function buildExecutionPrompt({
     "- Follow repository instructions in AGENTS.md and CLAUDE.md if present.",
     "- Read the compiled shared summary and your compiled inbox before taking action on every turn.",
     "- Post a coordination record on every meaningful turn with progress, decisions, blockers, handoffs, evidence, or explicit acknowledgement.",
+    "- If your inbox or the coordination log shows a targeted open request for you, your first durable action is to acknowledge it, resolve it, or emit a clarification or human-feedback request. Silent targeted requests are treated as active blockers.",
     "- Re-read the generated board projection before major edits, before commit or push, and before your final report.",
     "- If you change interfaces or contracts, include exact files and exact keys or fields affected.",
     "- If your task touches persisted state, implement the required schema or migration work instead of leaving TODOs.",
@@ -511,6 +512,89 @@ export function buildExecutionPrompt({
   ].join("\n");
 }
+export function buildResidentOrchestratorPrompt({
+  lane,
+  wave,
+  waveFile,
+  orchestratorId,
+  coordinationLogPath,
+  messageBoardPath,
+  sharedSummaryPath,
+  dashboardPath,
+  triagePath = null,
+  rolePrompt = "",
+}) {
+  const coordinationCommand = [
+    "pnpm exec wave coord post",
+    `--lane ${lane}`,
+    `--wave ${wave}`,
+    '--agent "launcher"',
+    '--kind "<request|ack|decision|blocker|clarification-request|orchestrator-guidance|resolved-by-policy|human-escalation|human-feedback>"',
+    '--summary "<one-line summary>"',
+    '--detail "<short detail>"',
+  ].join(" ");
+  const feedbackCommand = [
+    "pnpm exec wave-feedback ask",
+    `--lane ${lane}`,
+    `--wave ${wave}`,
+    '--agent "launcher"',
+    `--orchestrator-id ${orchestratorId}`,
+    '--question "<specific clarification needed>"',
+    '--context "<why repo-state or routed ownership was insufficient>"',
+    "--timeout-seconds 30",
+  ].join(" ");
+  const roleSection = String(rolePrompt || "").trim();
+  return [
+    `Working directory: ${REPO_ROOT}`,
+    "",
+    `You are the resident Wave orchestrator for lane ${lane}, wave ${wave}.`,
+    "Your job is to stay alive for the duration of the wave, monitor coordination state, and intervene when timing, routing, or escalation policy requires it.",
+    "The launcher remains the scheduler truth and closure authority. You are an intervention and triage role, not a product-code owner.",
+    "",
+    "Hard limits:",
+    "- Do not edit product code, test code, docs, or owned deliverables.",
+    "- Do not claim another agent's ownership slice or emit proof markers for owned implementation work.",
+    "- Do not declare the wave complete or override launcher gate results.",
+    "",
+    "Primary responsibilities:",
+    "- Monitor the canonical coordination log, shared summary, wave dashboard, and feedback triage artifacts.",
+    "- Keep clarification handling orchestrator-first: resolve from repo state, ownership, prior decisions, or targeted rerouting before opening human escalation.",
+    "- Watch for overdue acknowledgements, stale clarification chains, and pending human tickets.",
+    "- Post durable coordination records and orchestrator notes when you intervene.",
+    "- Stay available. If there is no immediate action to take, keep monitoring instead of exiting early.",
+    "",
+    "Files for this run:",
+    `- Wave file: ${waveFile}`,
+    `- Coordination log: ${coordinationLogPath}`,
+    `- Shared summary: ${sharedSummaryPath}`,
+    `- Wave dashboard: ${dashboardPath}`,
+    `- Message board projection: ${messageBoardPath}`,
+    ...(triagePath ? [`- Feedback triage log: ${triagePath}`] : []),
+    "",
+    "Action surface:",
+    `- Coordination command: \`${coordinationCommand}\``,
+    `- Human feedback command: \`${feedbackCommand}\``,
+    "- Use repository inspection and read-only analysis aggressively before escalating anything to a human.",
+    "- When you route or reroute work, name the owner, exact unblock condition, and the artifact or decision needed.",
+    "",
+    "Operating loop:",
+    "1. Read the shared summary, dashboard, and coordination log.",
+    "2. Identify open clarifications, open clarification-linked requests, overdue acknowledgements, and human-feedback state.",
+    "3. If action is needed, write a durable coordination update and explain the policy basis for the action.",
+    "4. If nothing needs action, continue monitoring. Do not exit until the wave is clearly terminal or the launcher stops the session.",
+    "",
+    ...(roleSection
+      ? [
+          "Resident orchestrator role prompt:",
+          "```text",
+          roleSection,
+          "```",
+          "",
+        ]
+      : []),
+  ].join("\n");
+}
 export function buildOrchestratorBoardTemplate(boardPath) {
   const now = toIsoTimestamp();
   return [

package/scripts/wave-orchestrator/dashboard-renderer.mjs CHANGED Viewed

@@ -182,6 +182,22 @@ function paintWaveAgentSummary(summary, wave, colorize = false) {
   return paint(summary, color, colorize);
 }
+function formatDurationMs(value) {
+  if (!Number.isFinite(value)) {
+    return "n/a";
+  }
+  const totalSeconds = Math.max(0, Math.floor(value / 1000));
+  if (totalSeconds < 60) {
+    return `${totalSeconds}s`;
+  }
+  const minutes = Math.floor(totalSeconds / 60);
+  if (minutes < 60) {
+    return `${minutes}m`;
+  }
+  const hours = Math.floor(minutes / 60);
+  return `${hours}h ${minutes % 60}m`;
+}
 function renderWaveDashboard({ state, dashboardPath, messageBoardPath, lane, colorize = false }) {
   if (!state) {
     return `Dashboard file not found or invalid: ${dashboardPath}`;
@@ -200,15 +216,21 @@ function renderWaveDashboard({ state, dashboardPath, messageBoardPath, lane, col
   );
   lines.push(`Run tag: ${state.runTag || "n/a"} | Wave file: ${state.waveFile || "n/a"}`);
   lines.push(`Counts: ${renderColoredCountsByState(state.agents || [], colorize) || "none"}`);
+  lines.push(
+    `Coordination: open=${state.coordinationOpen ?? 0} clarifications=${state.openClarifications ?? 0} human=${state.openHumanEscalations ?? 0} overdue-ack=${state.overdueAckCount ?? 0} overdue-clarification=${state.overdueClarificationCount ?? 0}`,
+  );
+  lines.push(
+    `Coordination age: oldest-open=${formatDurationMs(state.oldestOpenCoordinationAgeMs)} oldest-unack=${formatDurationMs(state.oldestUnackedRequestAgeMs)}`,
+  );
   const comms = analyzeMessageBoardCommunication(messageBoardPath);
   if (!comms.available) {
-    lines.push(`Comms: unavailable ${comms.reason || ""}`.trim());
+    lines.push(`Board comms: unavailable ${comms.reason || ""}`.trim());
   } else {
     lines.push(
-      `Comms: requests=${comms.actionableRequests} unresolved=${comms.unresolvedRequests} unacknowledged=${comms.unacknowledgedRequests} malformed=${comms.malformedEntries} placeholder-ts=${comms.placeholderTimestampEntries}`,
+      `Board comms: requests=${comms.actionableRequests} unresolved=${comms.unresolvedRequests} unacknowledged=${comms.unacknowledgedRequests} malformed=${comms.malformedEntries} placeholder-ts=${comms.placeholderTimestampEntries}`,
     );
     lines.push(
-      `Comms age: last-ack=${commsAgeSummary(comms.lastAcknowledgementTimestamp)} oldest-unack=${commsAgeSummary(comms.oldestUnacknowledgedTimestamp)}`,
+      `Board comms age: last-ack=${commsAgeSummary(comms.lastAcknowledgementTimestamp)} oldest-unack=${commsAgeSummary(comms.oldestUnacknowledgedTimestamp)}`,
     );
   }
   lines.push("");
@@ -306,6 +328,19 @@ function renderGlobalDashboard({ state, dashboardPath, lane, colorize = false })
         12,
       )} ${truncate(wave.lastMessage || "", 70)}`,
     );
+    if (
+      Number(wave?.coordinationOpen ?? 0) > 0 ||
+      Number(wave?.overdueAckCount ?? 0) > 0 ||
+      Number(wave?.overdueClarificationCount ?? 0) > 0 ||
+      Number(wave?.openHumanEscalations ?? 0) > 0
+    ) {
+      lines.push(
+        `      Coord: open ${wave.coordinationOpen ?? 0} clarifications ${wave.openClarifications ?? 0} human ${wave.openHumanEscalations ?? 0} overdue-ack ${wave.overdueAckCount ?? 0} overdue-clarification ${wave.overdueClarificationCount ?? 0}`,
+      );
+      lines.push(
+        `      Ages: oldest-open ${formatDurationMs(wave.oldestOpenCoordinationAgeMs)} oldest-unack ${formatDurationMs(wave.oldestUnackedRequestAgeMs)}`,
+      );
+    }
     const deployments = Array.isArray(wave.deployments) ? wave.deployments : [];
     if (deployments.length > 0) {
       const deployLine = deployments

package/scripts/wave-orchestrator/dashboard-state.mjs CHANGED Viewed

@@ -149,6 +149,13 @@ export function buildWaveDashboardState({
     helperAssignmentsOpen: 0,
     inboundDependenciesOpen: 0,
     outboundDependenciesOpen: 0,
+    coordinationOpen: 0,
+    openClarifications: 0,
+    openHumanEscalations: 0,
+    oldestOpenCoordinationAgeMs: null,
+    oldestUnackedRequestAgeMs: null,
+    overdueAckCount: 0,
+    overdueClarificationCount: 0,
     agents: agentRuns.map((run) => ({
       agentId: run.agent.agentId,
       title: run.agent.title,
@@ -200,6 +207,7 @@ export function buildGlobalDashboardState({
       maxRetriesPerWave: options.maxRetriesPerWave,
       dashboard: options.dashboard,
       cleanupSessions: options.cleanupSessions,
+      residentOrchestrator: options.residentOrchestrator === true,
       orchestratorId: options.orchestratorId,
       orchestratorBoardPath: options.orchestratorBoardPath
         ? path.relative(REPO_ROOT, options.orchestratorBoardPath)
@@ -235,6 +243,13 @@ export function buildGlobalDashboardState({
       helperAssignmentsOpen: 0,
       inboundDependenciesOpen: 0,
       outboundDependenciesOpen: 0,
+      coordinationOpen: 0,
+      openClarifications: 0,
+      openHumanEscalations: 0,
+      oldestOpenCoordinationAgeMs: null,
+      oldestUnackedRequestAgeMs: null,
+      overdueAckCount: 0,
+      overdueClarificationCount: 0,
       lastMessage: "",
       deployments: [],
       infraFindings: [],
@@ -323,6 +338,13 @@ export function syncGlobalWaveFromWaveDashboard(globalState, waveDashboard) {
   entry.helperAssignmentsOpen = waveDashboard.helperAssignmentsOpen || 0;
   entry.inboundDependenciesOpen = waveDashboard.inboundDependenciesOpen || 0;
   entry.outboundDependenciesOpen = waveDashboard.outboundDependenciesOpen || 0;
+  entry.coordinationOpen = waveDashboard.coordinationOpen || 0;
+  entry.openClarifications = waveDashboard.openClarifications || 0;
+  entry.openHumanEscalations = waveDashboard.openHumanEscalations || 0;
+  entry.oldestOpenCoordinationAgeMs = waveDashboard.oldestOpenCoordinationAgeMs ?? null;
+  entry.oldestUnackedRequestAgeMs = waveDashboard.oldestUnackedRequestAgeMs ?? null;
+  entry.overdueAckCount = waveDashboard.overdueAckCount || 0;
+  entry.overdueClarificationCount = waveDashboard.overdueClarificationCount || 0;
   entry.deployments = agents
     .filter((agent) => agent.deploymentState)
     .map((agent) => ({

package/scripts/wave-orchestrator/evals.mjs CHANGED Viewed

@@ -351,6 +351,12 @@ export function loadBenchmarkCatalog(options = {}) {
         id: benchmarkId,
         title: cleanText(benchmark.title) || benchmarkId,
         summary: cleanText(benchmark.summary) || null,
+        localCases: normalizeStringArray(
+          benchmark.localCases,
+          `families.${familyId}.benchmarks.${benchmarkId}.localCases`,
+        ).map((entry, index) =>
+          normalizeEvalTargetId(entry, `families.${familyId}.benchmarks.${benchmarkId}.localCases[${index}]`),
+        ),
         goal: cleanText(benchmark.goal) || null,
         failureModes: normalizeStringArray(
           benchmark.failureModes,
@@ -380,6 +386,12 @@ export function loadBenchmarkCatalog(options = {}) {
       id: familyId,
       title: cleanText(rawFamily.title) || familyId,
       summary: cleanText(rawFamily.summary) || null,
+      localCases: normalizeStringArray(
+        rawFamily.localCases,
+        `families.${familyId}.localCases`,
+      ).map((entry, index) =>
+        normalizeEvalTargetId(entry, `families.${familyId}.localCases[${index}]`),
+      ),
       category: cleanText(rawFamily.category) || null,
       coordinationModel: cleanText(rawFamily.coordinationModel) || null,
       primaryMetric: familyPrimaryMetric,
@@ -395,6 +407,17 @@ export function loadBenchmarkCatalog(options = {}) {
     absolutePath,
     families,
     benchmarkIndex,
+    localCaseIndex: Object.fromEntries(
+      Object.values(families).flatMap((family) => [
+        ...(family.localCases || []).map((caseId) => [caseId, { familyId: family.id, benchmarkId: null }]),
+        ...Object.values(family.benchmarks).flatMap((benchmark) =>
+          (benchmark.localCases || []).map((caseId) => [
+            caseId,
+            { familyId: family.id, benchmarkId: benchmark.id },
+          ]),
+        ),
+      ]),
+    ),
   };
 }

package/scripts/wave-orchestrator/executors.mjs CHANGED Viewed

@@ -210,7 +210,8 @@ function buildClaudeLaunchSpec({ agent, promptPath, logPath, overlayDir }) {
     systemPromptPath,
     `${renderHarnessSystemPrompt(agent, "claude")}${skillText ? `\n\n${skillText}` : ""}\n`,
   );
-  const tokens = [executor.claude.command, "-p", "--no-session-persistence"];
+  const command = executor?.claude?.command || "claude";
+  const tokens = [command, "-p", "--no-session-persistence"];
   const settingsPath = buildClaudeSettingsPath(executor, overlayDir);
   appendSingleValueFlag(tokens, "--output-format", executor.claude.outputFormat || "text");
   appendSingleValueFlag(tokens, "--model", executor.claude.model || executor.model);
@@ -234,7 +235,7 @@ function buildClaudeLaunchSpec({ agent, promptPath, logPath, overlayDir }) {
   );
   return {
     executorId: "claude",
-    command: executor.claude.command,
+    command,
     useRateLimitRetries: true,
     invocationLines: [
       `task_prompt=$(cat ${shellQuote(promptPath)})`,