npm - @llm-dev-ops/agentics-cli - Versions diffs - 2.7.41 → 2.8.0 - Mend

@llm-dev-ops/agentics-cli 2.7.41 → 2.8.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (195) hide show

package/agents/analytics-hub/consensus/consensus.md +47 -0
package/agents/analytics-hub/recommendation/recommendation.md +47 -0
package/agents/auto-optimizer/model-select/model-select.md +49 -0
package/agents/auto-optimizer/self-optimize/self-optimize.md +44 -0
package/agents/auto-optimizer/token/token.md +50 -0
package/agents/benchmark-exchange/publish/publish.md +29 -0
package/agents/config-manager/validate/validate.md +40 -0
package/agents/connector-hub/auth-identity/auth-identity.md +29 -0
package/agents/connector-hub/database-query/database-query.md +29 -0
package/agents/connector-hub/erp-surface/erp-surface.md +29 -0
package/agents/connector-hub/event-normalize/event-normalize.md +29 -0
package/agents/connector-hub/webhook-ingest/webhook-ingest.md +29 -0
package/agents/copilot/clarifier/clarifier.md +47 -0
package/agents/copilot/config/config.md +37 -0
package/agents/copilot/decomposer/decomposer.md +46 -0
package/agents/copilot/intent/intent.md +43 -0
package/agents/copilot/meta-reasoner/meta-reasoner.md +43 -0
package/agents/copilot/planner/planner.md +47 -0
package/agents/copilot/reflection/reflection.md +40 -0
package/agents/costops/attribution/attribution.md +39 -0
package/agents/costops/budget/budget.md +40 -0
package/agents/costops/forecast/forecast.md +40 -0
package/agents/costops/roi/roi.md +37 -0
package/agents/costops/tradeoff/tradeoff.md +39 -0
package/agents/data-vault/access-control/access-control.md +46 -0
package/agents/data-vault/anonymize/anonymize.md +54 -0
package/agents/edge/caching/caching.md +46 -0
package/agents/edge/circuit-breaker/circuit-breaker.md +44 -0
package/agents/edge/execution-guard/execution-guard.md +41 -0
package/agents/edge/failover/failover.md +45 -0
package/agents/edge/tool-invoke/tool-invoke.md +44 -0
package/agents/forge/api-translation/api-translation.md +29 -0
package/agents/forge/cli/cli.md +29 -0
package/agents/forge/sdk/sdk.md +29 -0
package/agents/forge/version-compat/version-compat.md +29 -0
package/agents/governance-dashboard/audit/audit.md +39 -0
package/agents/governance-dashboard/impact/impact.md +37 -0
package/agents/governance-dashboard/oversight/oversight.md +41 -0
package/agents/incident-manager/escalation/escalation.md +45 -0
package/agents/incident-manager/hitl/hitl.md +46 -0
package/agents/incident-manager/post-mortem/post-mortem.md +52 -0
package/agents/inference-gateway/route/route.md +29 -0
package/agents/latency-lens/cold-start/cold-start.md +29 -0
package/agents/latency-lens/latency/latency.md +29 -0
package/agents/marketplace/deprecation/deprecation.md +29 -0
package/agents/marketplace/package/package.md +29 -0
package/agents/memory-graph/conversation/conversation.md +37 -0
package/agents/memory-graph/decisions/decisions.md +45 -0
package/agents/memory-graph/knowledge-graph/knowledge-graph.md +46 -0
package/agents/memory-graph/lineage/lineage.md +37 -0
package/agents/memory-graph/patterns/patterns.md +45 -0
package/agents/memory-graph/retrieval/retrieval.md +43 -0
package/agents/observatory/failures/failures.md +29 -0
package/agents/observatory/health-check/health-check.md +29 -0
package/agents/observatory/post-mortem/post-mortem.md +29 -0
package/agents/observatory/slo/slo.md +29 -0
package/agents/observatory/telemetry/telemetry.md +29 -0
package/agents/observatory/usage-patterns/usage-patterns.md +29 -0
package/agents/observatory/visualization/visualization.md +29 -0
package/agents/orchestrator/dependencies/dependencies.md +40 -0
package/agents/orchestrator/parallel/parallel.md +43 -0
package/agents/orchestrator/retry/retry.md +45 -0
package/agents/orchestrator/scheduler/scheduler.md +44 -0
package/agents/orchestrator/state-machine/state-machine.md +53 -0
package/agents/orchestrator/swarm/swarm.md +44 -0
package/agents/orchestrator/workflow/workflow.md +48 -0
package/agents/platform/decision/decision.md +40 -0
package/agents/platform/decision-memo/decision-memo.md +69 -0
package/agents/platform/executive-summary/executive-summary.md +44 -0
package/agents/platform/risk-score/risk-score.md +50 -0
package/agents/policy-engine/approval/approval.md +40 -0
package/agents/policy-engine/constraints/constraints.md +38 -0
package/agents/policy-engine/enforce/enforce.md +39 -0
package/agents/registry/bootstrap/bootstrap.md +29 -0
package/agents/registry/index/index.md +29 -0
package/agents/registry/reputation/reputation.md +29 -0
package/agents/research-lab/hypothesis/hypothesis.md +50 -0
package/agents/research-lab/metrics/metrics.md +50 -0
package/agents/schema-registry/validate/validate.md +37 -0
package/agents/sentinel/alert/alert.md +29 -0
package/agents/sentinel/anomaly/anomaly.md +29 -0
package/agents/sentinel/correlation/correlation.md +29 -0
package/agents/sentinel/drift/drift.md +29 -0
package/agents/sentinel/rca/rca.md +29 -0
package/agents/shield/abuse/abuse.md +29 -0
package/agents/shield/credential-exposure/credential-exposure.md +29 -0
package/agents/shield/moderation/moderation.md +29 -0
package/agents/shield/pii/pii.md +29 -0
package/agents/shield/prompt-injection/prompt-injection.md +29 -0
package/agents/shield/redaction/redaction.md +29 -0
package/agents/shield/safety-boundary/safety-boundary.md +29 -0
package/agents/shield/secrets/secrets.md +29 -0
package/agents/shield/toxicity/toxicity.md +29 -0
package/agents/simulator/scenario/scenario.md +53 -0
package/agents/simulator/what-if/what-if.md +52 -0
package/agents/test-bench/adversarial/adversarial.md +33 -0
package/agents/test-bench/benchmark/benchmark.md +34 -0
package/agents/test-bench/bias/bias.md +33 -0
package/agents/test-bench/compare/compare.md +33 -0
package/agents/test-bench/consistency/consistency.md +33 -0
package/agents/test-bench/faithfulness/faithfulness.md +34 -0
package/agents/test-bench/golden-dataset/golden-dataset.md +33 -0
package/agents/test-bench/hallucination/hallucination.md +34 -0
package/agents/test-bench/prompt-sensitivity/prompt-sensitivity.md +33 -0
package/agents/test-bench/quality/quality.md +33 -0
package/agents/test-bench/red-team/red-team.md +33 -0
package/agents/test-bench/regression/regression.md +33 -0
package/agents/test-bench/stress/stress.md +34 -0
package/agents/test-bench/synthetic-data/synthetic-data.md +35 -0
package/dist/agents/agent-prompts.d.ts +77 -0
package/dist/agents/agent-prompts.d.ts.map +1 -0
package/dist/agents/agent-prompts.js +230 -0
package/dist/agents/agent-prompts.js.map +1 -0
package/dist/agents/repo-agent-runner.d.ts +1 -0
package/dist/agents/repo-agent-runner.d.ts.map +1 -1
package/dist/agents/repo-agent-runner.js +67 -35
package/dist/agents/repo-agent-runner.js.map +1 -1
package/dist/cli/index.js +22 -0
package/dist/cli/index.js.map +1 -1
package/dist/commands/agents.d.ts +19 -0
package/dist/commands/agents.d.ts.map +1 -1
package/dist/commands/agents.js +344 -144
package/dist/commands/agents.js.map +1 -1
package/dist/pipeline/auto-chain.d.ts.map +1 -1
package/dist/pipeline/auto-chain.js +18 -7
package/dist/pipeline/auto-chain.js.map +1 -1
package/dist/pipeline/fleet-dispatch-bounds.d.ts +115 -0
package/dist/pipeline/fleet-dispatch-bounds.d.ts.map +1 -0
package/dist/pipeline/fleet-dispatch-bounds.js +190 -0
package/dist/pipeline/fleet-dispatch-bounds.js.map +1 -0
package/dist/pipeline/output-validator.d.ts +7 -2
package/dist/pipeline/output-validator.d.ts.map +1 -1
package/dist/pipeline/output-validator.js +61 -4
package/dist/pipeline/output-validator.js.map +1 -1
package/dist/pipeline/phase2/phases/adr-generator.d.ts.map +1 -1
package/dist/pipeline/phase2/phases/adr-generator.js +6 -5
package/dist/pipeline/phase2/phases/adr-generator.js.map +1 -1
package/dist/pipeline/phase3/phases/domain-codegen.d.ts.map +1 -1
package/dist/pipeline/phase3/phases/domain-codegen.js +8 -2
package/dist/pipeline/phase3/phases/domain-codegen.js.map +1 -1
package/dist/pipeline/phase4/phases/schema-generator.js +3 -3
package/dist/pipeline/phase4/phases/schema-generator.js.map +1 -1
package/dist/pipeline/phase7/coherence-gate.d.ts.map +1 -1
package/dist/pipeline/phase7/coherence-gate.js +8 -24
package/dist/pipeline/phase7/coherence-gate.js.map +1 -1
package/dist/pipeline/phase7/coordinator.d.ts +34 -0
package/dist/pipeline/phase7/coordinator.d.ts.map +1 -1
package/dist/pipeline/phase7/coordinator.js +131 -71
package/dist/pipeline/phase7/coordinator.js.map +1 -1
package/dist/pipeline/phase7/field-mappers.d.ts +43 -0
package/dist/pipeline/phase7/field-mappers.d.ts.map +1 -0
package/dist/pipeline/phase7/field-mappers.js +278 -0
package/dist/pipeline/phase7/field-mappers.js.map +1 -0
package/dist/pipeline/phase7/field-writer.d.ts +53 -0
package/dist/pipeline/phase7/field-writer.d.ts.map +1 -0
package/dist/pipeline/phase7/field-writer.js +178 -0
package/dist/pipeline/phase7/field-writer.js.map +1 -0
package/dist/pipeline/phase7/writer-agent.d.ts +83 -0
package/dist/pipeline/phase7/writer-agent.d.ts.map +1 -0
package/dist/pipeline/phase7/writer-agent.js +174 -0
package/dist/pipeline/phase7/writer-agent.js.map +1 -0
package/dist/pipeline/ruflo-phase-executor.d.ts.map +1 -1
package/dist/pipeline/ruflo-phase-executor.js +49 -23
package/dist/pipeline/ruflo-phase-executor.js.map +1 -1
package/dist/pipeline/swarm-orchestrator.d.ts +3 -41
package/dist/pipeline/swarm-orchestrator.d.ts.map +1 -1
package/dist/pipeline/swarm-orchestrator.js +9 -75
package/dist/pipeline/swarm-orchestrator.js.map +1 -1
package/dist/synthesis/fcv-coherence.d.ts +24 -0
package/dist/synthesis/fcv-coherence.d.ts.map +1 -0
package/dist/synthesis/fcv-coherence.js +36 -0
package/dist/synthesis/fcv-coherence.js.map +1 -0
package/dist/synthesis/financial-claim-extractor.d.ts +8 -0
package/dist/synthesis/financial-claim-extractor.d.ts.map +1 -1
package/dist/synthesis/financial-claim-extractor.js +74 -1
package/dist/synthesis/financial-claim-extractor.js.map +1 -1
package/dist/synthesis/financial-consistency-rules.d.ts.map +1 -1
package/dist/synthesis/financial-consistency-rules.js +21 -12
package/dist/synthesis/financial-consistency-rules.js.map +1 -1
package/dist/synthesis/financial-consistency-runner.d.ts +12 -0
package/dist/synthesis/financial-consistency-runner.d.ts.map +1 -1
package/dist/synthesis/financial-consistency-runner.js +25 -3
package/dist/synthesis/financial-consistency-runner.js.map +1 -1
package/dist/synthesis/simulation-artifact-generator.d.ts.map +1 -1
package/dist/synthesis/simulation-artifact-generator.js +5 -0
package/dist/synthesis/simulation-artifact-generator.js.map +1 -1
package/dist/synthesis/simulation-renderers.d.ts +2 -0
package/dist/synthesis/simulation-renderers.d.ts.map +1 -1
package/dist/synthesis/simulation-renderers.js +8 -8
package/dist/synthesis/simulation-renderers.js.map +1 -1
package/dist/synthesis/unit-economics-loader.d.ts +7 -0
package/dist/synthesis/unit-economics-loader.d.ts.map +1 -1
package/dist/synthesis/unit-economics-loader.js +11 -2
package/dist/synthesis/unit-economics-loader.js.map +1 -1
package/package.json +8 -7

package/dist/commands/agents.js CHANGED Viewed

@@ -13,10 +13,186 @@ import { loadEndpointConfig } from '../config/endpoints.js';
 import { createAdapter } from '../adapters/base-adapter.js';
 import { getAnthropicApiKey } from '../utils/credentials.js';
 import { executeSimulateCommand } from './simulate.js';
-import { execFileSync } from 'node:child_process';
+import { execFile } from 'node:child_process';
+import { promisify } from 'node:util';
+import { writeFileSync as fsWriteFileSync, existsSync as fsExistsSync, readFileSync as fsReadFileSync } from 'node:fs';
+import { join as pathJoin } from 'node:path';
 import { isTransientFailure, isTerminalFailure } from '../errors/transient.js';
 import { recordDegradation, drainDegradations } from '../observability/degradations.js';
 import { computePhase1Verdict } from '../pipeline/phase1-verdict.js';
+// ADR-PIPELINE-108: shared dispatch bounds (per-agent timeout + cloud breaker).
+import { CloudCircuitBreaker, resolveFleetDispatchConfig, withAgentTimeout, AGENT_TIMED_OUT, raceFleetDeadline, decideAgentTier, } from '../pipeline/fleet-dispatch-bounds.js';
+// ADR-PIPELINE-109: repo-backed agent execution (Tier 1).
+import { isRepoAgentMode, hasRepoAgent, isDomainSourceCached, executeRepoAgent, } from '../agents/repo-agent-runner.js';
+// Per-agent sub-prompt wiring: inject each agent's hand-authored guidance
+// (agents/<domain>/<agent>/<agent>.md) + use case + prior run outputs into the
+// payload so it reaches the repo handler's callClaude prompt and the cloud tier.
+import { composeAgentExecutionContext, injectGuidanceIntoPayload, extractUseCase, getPriorAgentOutputs, recordAgentOutput, resetAgentRunContext, summarizeAgentResponse, } from '../agents/agent-prompts.js';
+const execFileAsync = promisify(execFile);
+/**
+ * ADR-PIPELINE-108 D3: resolve the `claude` binary once per process. Order:
+ * AGENTICS_CLAUDE_BIN (used as-is), else first `which`/`where` hit for `claude`,
+ * then `claude-code`. Null if none is found (callers use cloud); null is cached.
+ */
+// Cache for resolveClaudeBin(): the shared lookup promise. It is assigned
+// before the first await, so concurrent callers reuse ONE resolution, and
+// execFileAsync (not execFileSync) keeps the event loop unblocked meanwhile.
+let _claudeBinPromise;
+function resolveClaudeBin() {
+    if (_claudeBinPromise)
+        return _claudeBinPromise;
+    _claudeBinPromise = (async () => {
+        const envBin = process.env['AGENTICS_CLAUDE_BIN'];
+        if (envBin)
+            return envBin;
+        for (const candidate of ['claude', 'claude-code']) {
+            try {
+                const { stdout } = await execFileAsync(process.platform === 'win32' ? 'where' : 'which', [candidate], { encoding: 'utf-8', timeout: 5_000 });
+                const found = stdout.trim().split(/\r?\n/)[0]?.trim();
+                if (found)
+                    return found;
+            }
+            catch { /* lookup failed or timed out — try next candidate */ }
+        }
+        return null;
+    })();
+    return _claudeBinPromise;
+}
+/**
+ * ADR-PIPELINE-108 D4: true when `domain`/`agent` has a LOCAL execution path
+ * (claude --print): every `copilot` agent, plus `inference-gateway`/`route`
+ * (ADR-066, Claude Max). Callers in this file use it to exempt such agents
+ * from the preflight cloud-health probe and from cloud-breaker accounting.
+ */
+function isLocallyServable(domain, agent) {
+    if (domain === 'copilot')
+        return true;
+    if (domain === 'inference-gateway' && agent === 'route')
+        return true;
+    return false;
+}
+/**
+ * ADR-PIPELINE-108 D1/D2: invoke ONE fleet agent, bounded by `perAgentMs` and
+ * the cloud `breaker`. Failures resolve (not reject) to a result object:
+ * status 0 = breaker-skipped, 504 = timed out, 502 = threw, else agent status.
+ */
+async function boundedFleetInvoke(domain, agent, query, options, correlationId, breaker, perAgentMs) {
+    const id = `${domain}/${agent}`;
+    const local = isLocallyServable(domain, agent);
+    // D2: once the breaker has tripped, skip remaining cloud agents instead of
+    // each eating its full per-agent timeout. Local-capable agents still run.
+    if (!local && breaker.shouldSkip()) {
+        return { kind: 'agent', domain, agent, status: 0, response: { _breaker_skipped: true, reason: 'cloud-breaker-tripped' } };
+    }
+    try {
+        const payload = buildDomainPayload(domain, agent, query, correlationId);
+        // D1: race against the per-agent deadline; AGENT_TIMED_OUT marks a timeout.
+        const raced = await withAgentTimeout(executeAgentsInvokeCommand(domain, agent, payload, options), perAgentMs);
+        if (raced === AGENT_TIMED_OUT) {
+            if (!local)
+                breaker.record(true, 'cloud', id);
+            return { kind: 'agent', domain, agent, status: 504, response: { _timeout: true, error: `agent ${id} timed out after ${perAgentMs}ms` } };
+        }
+        const result = raced; // narrowed to AgentsInvokeResult after the sentinel check
+        const respObj = result.response && typeof result.response === 'object' ? result.response : undefined;
+        const isFallback = respObj?.['_fallback'] === true;
+        const failed = (result.status ?? 200) >= 400;
+        if (!local)
+            breaker.record(failed, isFallback ? 'local' : 'cloud', id);
+        // ADR-PIPELINE-109 D5: carry the execution tier that served this agent.
+        const tier = classifyExecutionTier(result);
+        // Record this agent's output into the run-scoped accumulator so later agents
+        // dispatched in this run can review what was already produced.
+        recordAgentOutput({
+            domain,
+            agent,
+            status: result.status ?? 200,
+            tier,
+            summary: summarizeAgentResponse(result.response),
+        });
+        return { kind: 'agent', domain, agent, status: result.status ?? 200, response: result.response, execution_tier: tier };
+    }
+    catch (err) {
+        if (!local)
+            breaker.record(true, 'cloud', id);
+        return { kind: 'agent', domain, agent, status: 502, response: { error: err instanceof Error ? err.message : String(err) } };
+    }
+}
+/**
+ * ADR-PIPELINE-109 D5: one-line provenance summary of `results` by
+ * `execution_tier`, e.g. "3 repo · 5 cloud · 1 synthetic · 2 unavailable".
+ * No recognized tier (skipped / timed-out / errored) = unavailable; hidden if 0.
+ */
+function summarizeTiers(results) {
+    let repo = 0, cloud = 0, synthetic = 0, unavailable = 0;
+    for (const r of results) {
+        if (r.execution_tier === 'repo')
+            repo++;
+        else if (r.execution_tier === 'cloud')
+            cloud++;
+        else if (r.execution_tier === 'synthetic')
+            synthetic++;
+        else
+            unavailable++;
+    }
+    return `${repo} repo · ${cloud} cloud · ${synthetic} synthetic` + (unavailable ? ` · ${unavailable} unavailable` : '');
+}
+/**
+ * ADR-PIPELINE-108 D4: probe the cloud backends behind `refs` (via the lazily
+ * imported Phase 2 preflight) and resolve to a Set of the `domain/agent` ids it
+ * marks skipped. Local-capable and repo-tier agents are never probed. Never
+ * throws: an import/probe error logs and yields an empty Set (dispatch all).
+ * The preflight verdict is only logged; Phase 1 degrades rather than halts.
+ */
+async function fleetPreflightSkipSet(refs, traceId) {
+    try {
+        const { runPhase2Preflight } = await import('../pipeline/phase2-preflight.js');
+        const cloudRefs = refs
+            // ADR-PIPELINE-109 D5 ↔ ADR-108 D4: agents served locally (claude path) or
+            // by their repo tier do not need a healthy cloud backend — don't probe them.
+            .filter((r) => !isLocallyServable(r.domain, r.agent) && resolveAgentTier(r.domain) !== 'repo')
+            .map((r) => ({ domain: r.domain, agent: r.agent, service: `${r.domain}-agents` }));
+        if (cloudRefs.length === 0)
+            return new Set();
+        const pf = await runPhase2Preflight(cloudRefs, traceId);
+        console.error(`  [PREFLIGHT] ${pf.healthy.length}/${pf.probed} fleet backends healthy in ${pf.durationMs}ms (verdict: ${pf.verdict})`);
+        if (pf.skipped.length > 0) {
+            console.error(`  [PREFLIGHT] Skipping ${pf.skipped.length} agents on unhealthy backends: ${pf.unhealthy.join(', ')}`);
+        }
+        return new Set(pf.skipped);
+    }
+    catch (err) {
+        console.error(`  [PREFLIGHT] probe skipped (error: ${err instanceof Error ? err.message : String(err)}) — dispatching full fleet`);
+        return new Set();
+    }
+}
+/**
+ * ADR-PIPELINE-108 D5: persist the fleet-dispatch `record` and Phase 1
+ * `verdict` under `runDir`. Writes `record` to a DEDICATED `fleet-dispatch.json`
+ * (later phases never rewrite it, unlike `manifest.json`, which Phases 2–7
+ * overwrite), then, if `manifest.json` exists, adds phase1_* + fleet_dispatch
+ * keys to it. Never throws: any fs/JSON error is swallowed (observability).
+ */
+function persistFleetDispatch(runDir, record, verdict) {
+    try {
+        // 1) Dedicated, stable artifact — the authoritative D5 record. Written
+        //    SYNCHRONOUSLY (no await) so no event-loop yield can interleave or be
+        //    interrupted before the write lands.
+        fsWriteFileSync(pathJoin(runDir, 'fleet-dispatch.json'), JSON.stringify(record, null, 2), 'utf-8');
+        // 2) Best-effort manifest patch (may be overwritten by later phases).
+        const mPath = pathJoin(runDir, 'manifest.json');
+        if (fsExistsSync(mPath)) {
+            const m = JSON.parse(fsReadFileSync(mPath, 'utf-8'));
+            m['phase1_verdict'] = verdict.verdict;
+            m['phase1_reason'] = verdict.reason;
+            m['phase1_degradations'] = verdict.degradations;
+            m['phase1_stats'] = verdict.stats;
+            m['fleet_dispatch'] = record;
+            fsWriteFileSync(mPath, JSON.stringify(m, null, 2), 'utf-8');
+        }
+    }
+    catch { /* non-fatal */ }
+}
 // ============================================================================
 // ADR-066: Copilot agents via claude --print (Claude Max — no API key needed)
 // ============================================================================
@@ -30,31 +206,17 @@ const COPILOT_PROMPTS = {
     'meta-reasoner': 'You are a meta-reasoning agent. Analyze the reasoning traces and identify optimization opportunities. Return JSON: { insights: [], optimizations: [], confidence: number }',
 };
 async function runCopilotViaClaudeMax(agent, payload, correlationId) {
-    // Find claude binary
-    let claudeBin = null;
-    const envBin = process.env['AGENTICS_CLAUDE_BIN'];
-    if (envBin) {
-        claudeBin = envBin;
-    }
-    else {
-        for (const candidate of ['claude', 'claude-code']) {
-            try {
-                const found = execFileSync(process.platform === 'win32' ? 'where' : 'which', [candidate], { stdio: ['pipe', 'pipe', 'pipe'], timeout: 5_000, encoding: 'utf-8' }).trim().split(/\r?\n/)[0]?.trim();
-                if (found) {
-                    claudeBin = found;
-                    break;
-                }
-            }
-            catch { /* not found */ }
-        }
-    }
+    // ADR-PIPELINE-108 D3: memoized binary resolution (no per-agent `which`).
+    const claudeBin = await resolveClaudeBin();
     if (!claudeBin)
         return null; // claude not available — fall through to cloud function
     const systemPrompt = COPILOT_PROMPTS[agent] ?? `You are a ${agent} agent. Analyze the following and return structured JSON.`;
     const query = String(payload['objective'] ?? payload['text'] ?? payload['query'] ?? JSON.stringify(payload));
     const fullPrompt = `${systemPrompt}\n\nInput:\n${query}\n\nReturn ONLY valid JSON, no markdown fences.`;
     try {
-        const rawOutput = execFileSync(claudeBin, [
+        // ADR-PIPELINE-108 D3: async exec — does NOT block the event loop, so the
+        // ~109-agent fleet runs concurrently instead of serializing behind this call.
+        const { stdout: rawOutput } = await execFileAsync(claudeBin, [
             '--print',
             '--output-format', 'text',
             '--model', process.env['AGENTICS_CLAUDE_MODEL'] || 'claude-sonnet-4-20250514',
@@ -63,7 +225,6 @@ async function runCopilotViaClaudeMax(agent, payload, correlationId) {
             encoding: 'utf-8',
             timeout: 60_000,
             maxBuffer: 5 * 1024 * 1024,
-            stdio: ['pipe', 'pipe', 'pipe'],
             env: { ...process.env, MCP_SERVER_MODE: undefined },
         });
         // Parse JSON from output
@@ -102,23 +263,8 @@ async function runCopilotViaClaudeMax(agent, payload, correlationId) {
 // for a request given hints). We run it locally through the user's Claude Max
 // session so no server-side Anthropic API key is required.
 async function runInferenceRoutingViaClaudeMax(payload, correlationId) {
-    let claudeBin = null;
-    const envBin = process.env['AGENTICS_CLAUDE_BIN'];
-    if (envBin) {
-        claudeBin = envBin;
-    }
-    else {
-        for (const candidate of ['claude', 'claude-code']) {
-            try {
-                const found = execFileSync(process.platform === 'win32' ? 'where' : 'which', [candidate], { stdio: ['pipe', 'pipe', 'pipe'], timeout: 5_000, encoding: 'utf-8' }).trim().split(/\r?\n/)[0]?.trim();
-                if (found) {
-                    claudeBin = found;
-                    break;
-                }
-            }
-            catch { /* not found */ }
-        }
-    }
+    // ADR-PIPELINE-108 D3: memoized binary resolution (no per-agent `which`).
+    const claudeBin = await resolveClaudeBin();
     if (!claudeBin)
         return null;
     const systemPrompt = [
@@ -144,7 +290,8 @@ async function runInferenceRoutingViaClaudeMax(payload, correlationId) {
     ].join('\n');
     const fullPrompt = `${systemPrompt}\n\nRequest:\n${JSON.stringify(payload, null, 2)}`;
     try {
-        const rawOutput = execFileSync(claudeBin, [
+        // ADR-PIPELINE-108 D3: async exec — non-blocking.
+        const { stdout: rawOutput } = await execFileAsync(claudeBin, [
             '--print',
             '--output-format', 'text',
             '--model', process.env['AGENTICS_CLAUDE_MODEL'] || 'claude-sonnet-4-20250514',
@@ -153,7 +300,6 @@ async function runInferenceRoutingViaClaudeMax(payload, correlationId) {
             encoding: 'utf-8',
             timeout: 60_000,
             maxBuffer: 5 * 1024 * 1024,
-            stdio: ['pipe', 'pipe', 'pipe'],
             env: { ...process.env, MCP_SERVER_MODE: undefined },
         });
         let cleaned = rawOutput.trim();
@@ -334,6 +480,38 @@ export const RESOLUTION_ONLY_DOMAINS = new Set([
 export function isResolutionOnlyDomain(domain) {
     return RESOLUTION_ONLY_DOMAINS.has(domain);
 }
+/**
+ * ADR-PIPELINE-109 D5: classify how `result` was produced, for provenance.
+ * An `execution_tier` already on the result (e.g. `repo` from Tier 1) wins;
+ * else `response._fallback === true` means a synthetic stub ('synthetic'), and
+ * everything else, local-claude (ADR-066) included, is reported as 'cloud'.
+ */
+export function classifyExecutionTier(result) {
+    if (result.execution_tier)
+        return result.execution_tier;
+    const resp = result.response;
+    if (resp && typeof resp === 'object' && resp['_fallback'] === true) {
+        return 'synthetic';
+    }
+    return 'cloud';
+}
+/**
+ * ADR-PIPELINE-109 D3/D4: pick the execution tier for `domain`; callers in
+ * this file compare the result against 'repo' and otherwise use the cloud path.
+ * Per decideAgentTier's contract: `AGENTICS_AGENT_TIER` forces a tier; default
+ * `auto` prefers repo when the domain is repo-eligible (repo mode + repo mapping
+ * + source cached — D2); a forced repo tier skips the source-cache gate.
+ */
+export function resolveAgentTier(domain) {
+    // The pure decision lives in fleet-dispatch-bounds (unit-testable); this
+    // wrapper only feeds it the env override and the live repo-agent predicates.
+    return decideAgentTier({
+        forced: process.env['AGENTICS_AGENT_TIER'],
+        hasRepo: hasRepoAgent(domain),
+        repoMode: isRepoAgentMode(),
+        sourceCached: isDomainSourceCached(domain),
+    });
+}
 // ============================================================================
 // Command Implementations
 // ============================================================================
@@ -416,7 +594,43 @@ export async function executeAgentsInvokeCommand(domain, agent, payload, options
             }
         }
     }
-    // Go directly to Cloud Run services — no repo-local fallback chain
+    // Per-agent sub-prompt wiring: prepend the agent's hand-authored guidance
+    // (agents/<domain>/<agent>/<agent>.md), the run's use case, and any outputs
+    // already produced earlier in this run onto the payload text. This reaches the
+    // repo handler's callClaude userMessage (Tier 1) and persists into the cloud
+    // fallback payload (Tier 2), so the sub-prompt's "execute your repo code,
+    // review the use case, review prior outputs" instruction is actually applied.
+    if (normalizedPayload && typeof normalizedPayload === 'object') {
+        const payloadObj = normalizedPayload;
+        const guidance = composeAgentExecutionContext({
+            domain,
+            agent,
+            useCase: extractUseCase(payloadObj),
+            priorOutputs: getPriorAgentOutputs(),
+        });
+        if (guidance) {
+            normalizedPayload = injectGuidanceIntoPayload(payloadObj, guidance);
+        }
+    }
+    // ADR-PIPELINE-109 D3/D4: Tier 1 — run the agent's REAL repo code (its actual
+    // handler + system prompts) via claude --print. Chosen when the domain is
+    // repo-eligible (D2 cache gate) or forced via AGENTICS_AGENT_TIER=repo. On any
+    // non-2xx (auth/provision/handler failure) we degrade to the cloud tier (D6),
+    // visibly — never silently presenting a synthetic stub as repo output.
+    if (resolveAgentTier(domain) === 'repo') {
+        const repoResult = await executeRepoAgent(domain, agent, normalizedPayload, correlationId);
+        if (repoResult.status >= 200 && repoResult.status < 300) {
+            // Preserve the tier executeRepoAgent set: 'repo' only for a genuine
+            // handler run; its internal system-prompt / rust-native fallbacks
+            // self-tag 'synthetic' so provenance is not inflated (ADR-109 D5).
+            return { ...repoResult, execution_tier: repoResult.execution_tier ?? 'repo' };
+        }
+        const reason = (repoResult.response && typeof repoResult.response === 'object'
+            ? repoResult.response['error']
+            : undefined) ?? `status ${repoResult.status}`;
+        console.error(`  [TIER] ${domain}/${agent} repo tier unavailable (${String(reason).slice(0, 80)}) — degrading to cloud`);
+    }
+    // Tier 2: Cloud Run services (Tier 3 synthetic fallback computed on failure).
     const config = loadEndpointConfig(domainConfig.serviceName);
     const adapter = createAdapter(domainConfig.serviceName, config, correlationId);
     // ADR-066: Copilot agents run via claude --print (Claude Max) — no API key needed
@@ -3845,40 +4059,36 @@ export async function executeNaturalLanguageRoute(query, options) {
                     console.error(`  [RUVECTOR] Simulation failed after ${MAX_RETRIES + 1} attempts: ${lastErr?.message ?? 'unknown error'}`);
                     return { kind: 'simulation', domain: 'simulator', agent: 'enterprise', status: 502, response: { error: lastErr?.message ?? 'Enterprise simulation failed after retries' } };
                 })();
-                // Dispatch graph-selected agents in parallel
-                const REPO_LOCAL_DOMAINS = new Set(['copilot']);
-                const prevLocalAgents = process.env['AGENTICS_LOCAL_AGENTS'];
-                console.error(`  Dispatching ${graphResult.agents.length} graph-routed agents...`);
-                const agentPromises = [];
-                for (const ref of graphResult.agents) {
-                    agentPromises.push((async () => {
-                        try {
-                            if (!REPO_LOCAL_DOMAINS.has(ref.domain)) {
-                                process.env['AGENTICS_LOCAL_AGENTS'] = 'false';
-                            }
-                            else if (prevLocalAgents !== undefined) {
-                                process.env['AGENTICS_LOCAL_AGENTS'] = prevLocalAgents;
-                            }
-                            else {
-                                delete process.env['AGENTICS_LOCAL_AGENTS'];
-                            }
-                            const payload = buildDomainPayload(ref.domain, ref.agent, query, correlationId);
-                            const result = await executeAgentsInvokeCommand(ref.domain, ref.agent, payload, options);
-                            return { kind: 'agent', domain: ref.domain, agent: ref.agent, status: result.status ?? 200, response: result.response };
-                        }
-                        catch (err) {
-                            return { kind: 'agent', domain: ref.domain, agent: ref.agent, status: 502, response: { error: err instanceof Error ? err.message : String(err) } };
-                        }
-                    })());
-                }
-                const allResults = await Promise.allSettled([Promise.resolve(simResult), ...agentPromises]);
+                // ADR-PIPELINE-108 D1/D2/D4 — bounded, non-blocking graph-routed dispatch
+                // (same discipline as the full-fleet path: per-agent timeout + breaker +
+                // preflight skip; no racy per-agent process.env toggling).
+                // Start each `agentics ask` run with an empty prior-output accumulator so
+                // agents only see outputs from THIS run (matters in the long-lived MCP
+                // server; harmless in the short-lived CLI process).
+                resetAgentRunContext();
+                const fleetCfg = resolveFleetDispatchConfig();
+                const fleetBreaker = new CloudCircuitBreaker(fleetCfg.cloud_breaker_threshold);
+                const fleetSkip = await fleetPreflightSkipSet(graphResult.agents, correlationId);
+                const dispatchAgents = graphResult.agents.filter((a) => !fleetSkip.has(`${a.domain}/${a.agent}`));
+                const fleetPreflightSkipped = graphResult.agents.length - dispatchAgents.length;
+                console.error(`  Dispatching ${dispatchAgents.length} graph-routed agents (preflight-skipped ${fleetPreflightSkipped})...`);
+                const completedFleet = [];
+                const agentPromises = dispatchAgents.map((ref) => boundedFleetInvoke(ref.domain, ref.agent, query, options, correlationId, fleetBreaker, fleetCfg.agent_timeout_ms)
+                    .then((r) => { completedFleet.push(r); return r; }));
+                // D2: fleet-wide deadline.
+                const settledOrTimeout = await raceFleetDeadline(Promise.allSettled([Promise.resolve(simResult), ...agentPromises]), fleetCfg.fleet_timeout_ms);
                 const elapsed = Date.now() - start;
-                // Restore repo-local mode
-                if (prevLocalAgents !== undefined) {
-                    process.env['AGENTICS_LOCAL_AGENTS'] = prevLocalAgents;
+                console.error(`  [TIER] execution: ${summarizeTiers(completedFleet)}`);
+                let allResults;
+                if (settledOrTimeout === 'TIMEOUT') {
+                    allResults = [
+                        { status: 'fulfilled', value: simResult },
+                        ...completedFleet.map((v) => ({ status: 'fulfilled', value: v })),
+                    ];
+                    console.error(`  [FLEET] deadline ${fleetCfg.fleet_timeout_ms}ms hit — ${completedFleet.length}/${dispatchAgents.length} agents completed`);
                 }
                 else {
-                    delete process.env['AGENTICS_LOCAL_AGENTS'];
+                    allResults = settledOrTimeout;
                 }
                 // Build multi-result response
                 const intents = [];
@@ -3927,7 +4137,7 @@ export async function executeNaturalLanguageRoute(query, options) {
                         executionId: correlationId,
                         query,
                         simulationResult: simulationData,
-                        platformAnalysis: agentResults.map(p => ({ domain: p.domain, agent: p.agent, status: p.status, response: p.response })),
+                        platformAnalysis: agentResults.map(p => ({ domain: p.domain, agent: p.agent, status: p.status, response: p.response, execution_tier: p.execution_tier })),
                         correlationId,
                         timing: elapsed,
                     });
@@ -3951,25 +4161,18 @@ export async function executeNaturalLanguageRoute(query, options) {
                 // leaking state into subsequent runs (tests, daemons).
                 const degradations = drainDegradations(correlationId);
                 const phase1Verdict = computePhase1Verdict(invocations, degradations, artifactFilesGraphRouted);
-                // ADR-PIPELINE-089 §2: patch verdict into manifest.json so
-                // downstream phases (and `agentics status`) can read it without
-                // keeping state in memory. Best-effort; manifest may not exist if
-                // the artifact generator itself threw.
+                // ADR-PIPELINE-089 §2 + ADR-PIPELINE-108 D5: persist verdict + dispatch
+                // bounds (dedicated fleet-dispatch.json + best-effort manifest patch).
                 if (artifactRunDirGraphRouted) {
-                    try {
-                        const fsMod = await import('node:fs');
-                        const pathMod = await import('node:path');
-                        const mPath = pathMod.join(artifactRunDirGraphRouted, 'manifest.json');
-                        if (fsMod.existsSync(mPath)) {
-                            const m = JSON.parse(fsMod.readFileSync(mPath, 'utf-8'));
-                            m['phase1_verdict'] = phase1Verdict.verdict;
-                            m['phase1_reason'] = phase1Verdict.reason;
-                            m['phase1_degradations'] = phase1Verdict.degradations;
-                            m['phase1_stats'] = phase1Verdict.stats;
-                            fsMod.writeFileSync(mPath, JSON.stringify(m, null, 2), 'utf-8');
-                        }
-                    }
-                    catch { /* non-fatal */ }
+                    persistFleetDispatch(artifactRunDirGraphRouted, {
+                        ...fleetCfg,
+                        dispatched: dispatchAgents.length,
+                        total: graphResult.agents.length,
+                        preflight_skipped: fleetPreflightSkipped,
+                        breaker_tripped: fleetBreaker.state().tripped,
+                        breaker_after_n_timeouts: fleetBreaker.state().after_n_timeouts,
+                        elapsed_ms: elapsed,
+                    }, phase1Verdict);
                 }
                 // One-line verdict banner — visible on the terminal and captured by
                 // the MCP tool wrapper for status surfacing.
@@ -4205,59 +4408,56 @@ export async function executeNaturalLanguageRoute(query, options) {
             console.error(`  [RUVECTOR] Simulation failed after ${MAX_RETRIES + 1} attempts: ${lastErr?.message ?? 'unknown error'}`);
             return { kind: 'simulation', domain: 'simulator', agent: 'enterprise', status: 502, response: { error: lastErr?.message ?? 'Enterprise simulation failed after retries' } };
         })();
-        // For fleet dispatch, skip repo-local mode (which downloads source from GCS and
-        // spawns subprocesses) to go directly to the deployed cloud functions. This
-        // eliminates contention from 109 concurrent GCS downloads.
-        // Exception: copilot agents require repo-local because the cloud function needs
-        // an Anthropic API key that only the repo-local shim can provide.
-        const REPO_LOCAL_DOMAINS = new Set(['copilot']);
-        const prevLocalAgents = process.env['AGENTICS_LOCAL_AGENTS'];
-        // Dispatch fleet agents in staggered waves to reduce GCF cold-start pressure.
-        // Wave size of 15 agents with 2s delay between waves gives functions time to warm.
+        // ADR-PIPELINE-108 D1/D2/D4/D5 — bounded, non-blocking fleet dispatch.
+        // Per-agent timeout + cloud circuit breaker + preflight skip, so the
+        // fleet cannot stall on the slowest of ~109 cloud calls. No per-agent
+        // process.env toggling (it was racy under concurrency, and
+        // executeAgentsInvokeCommand no longer branches on repo mode).
+        const fleetCfg = resolveFleetDispatchConfig();
+        const fleetBreaker = new CloudCircuitBreaker(fleetCfg.cloud_breaker_threshold);
+        // D4: skip agents whose cloud backend is already unhealthy. Locally-served
+        // agents (copilot/*, inference-gateway/route) are never skipped.
+        const fleetSkip = await fleetPreflightSkipSet(fleetAgents, correlationId);
+        const dispatchAgents = fleetAgents.filter((a) => !fleetSkip.has(`${a.domain}/${a.agent}`));
+        const fleetPreflightSkipped = fleetAgents.length - dispatchAgents.length;
+        // Dispatch in staggered waves to reduce GCF cold-start pressure.
         const WAVE_SIZE = 15;
         const WAVE_DELAY_MS = 2000;
+        const completedFleet = [];
         const agentPromises = [];
-        for (let i = 0; i < fleetAgents.length; i += WAVE_SIZE) {
-            const wave = fleetAgents.slice(i, i + WAVE_SIZE);
+        for (let i = 0; i < dispatchAgents.length; i += WAVE_SIZE) {
+            const wave = dispatchAgents.slice(i, i + WAVE_SIZE);
             const waveNum = Math.floor(i / WAVE_SIZE) + 1;
-            const totalWaves = Math.ceil(fleetAgents.length / WAVE_SIZE);
+            const totalWaves = Math.ceil(dispatchAgents.length / WAVE_SIZE);
             console.error(`  Wave ${waveNum}/${totalWaves}: ${wave.length} agents (${wave.map(a => `${a.domain}/${a.agent}`).slice(0, 3).join(', ')}${wave.length > 3 ? '...' : ''})`);
             for (const { domain, agent } of wave) {
-                agentPromises.push((async () => {
-                    try {
-                        // Toggle repo-local per-agent: only copilot uses repo-local
-                        if (!REPO_LOCAL_DOMAINS.has(domain)) {
-                            process.env['AGENTICS_LOCAL_AGENTS'] = 'false';
-                        }
-                        else if (prevLocalAgents !== undefined) {
-                            process.env['AGENTICS_LOCAL_AGENTS'] = prevLocalAgents;
-                        }
-                        else {
-                            delete process.env['AGENTICS_LOCAL_AGENTS'];
-                        }
-                        const payload = buildDomainPayload(domain, agent, query, correlationId);
-                        const result = await executeAgentsInvokeCommand(domain, agent, payload, options);
-                        return { kind: 'agent', domain, agent, status: result.status ?? 200, response: result.response };
-                    }
-                    catch (err) {
-                        return { kind: 'agent', domain, agent, status: 502, response: { error: err instanceof Error ? err.message : String(err) } };
-                    }
-                })());
+                agentPromises.push(boundedFleetInvoke(domain, agent, query, options, correlationId, fleetBreaker, fleetCfg.agent_timeout_ms)
+                    .then((r) => { completedFleet.push(r); return r; }));
             }
             // Stagger between waves (skip delay on last wave)
-            if (i + WAVE_SIZE < fleetAgents.length) {
+            if (i + WAVE_SIZE < dispatchAgents.length) {
                 await new Promise(resolve => setTimeout(resolve, WAVE_DELAY_MS));
             }
         }
-        const allResults = await Promise.allSettled([Promise.resolve(simResult), ...agentPromises]);
+        // D2: fleet-wide deadline — collect partial results rather than hang on
+        // any still-pending agent. boundedFleetInvoke never rejects, so the
+        // completedFleet snapshot is authoritative on timeout.
+        const settledOrTimeout = await raceFleetDeadline(Promise.allSettled([Promise.resolve(simResult), ...agentPromises]), fleetCfg.fleet_timeout_ms);
         const elapsed = Date.now() - start;
-        // Restore repo-local mode setting
-        if (prevLocalAgents !== undefined) {
-            process.env['AGENTICS_LOCAL_AGENTS'] = prevLocalAgents;
+        let allResults;
+        if (settledOrTimeout === 'TIMEOUT') {
+            allResults = [
+                { status: 'fulfilled', value: simResult },
+                ...completedFleet.map((v) => ({ status: 'fulfilled', value: v })),
+            ];
+            console.error(`  [FLEET] deadline ${fleetCfg.fleet_timeout_ms}ms hit — ${completedFleet.length}/${dispatchAgents.length} agents completed`);
         }
         else {
-            delete process.env['AGENTICS_LOCAL_AGENTS'];
+            allResults = settledOrTimeout;
         }
+        const fleetBreakerState = fleetBreaker.state();
+        console.error(`  [FLEET] dispatched ${dispatchAgents.length}/${fleetAgents.length} in ${(elapsed / 1000).toFixed(1)}s (preflight-skipped ${fleetPreflightSkipped}; breaker ${fleetBreakerState.tripped ? `TRIPPED after ${fleetBreakerState.after_n_timeouts}` : 'ok'}; bounds per-agent=${fleetCfg.agent_timeout_ms}ms fleet=${fleetCfg.fleet_timeout_ms}ms)`);
+        console.error(`  [TIER] execution: ${summarizeTiers(completedFleet)}`);
         // Build multi-result response from ALL agents
         const intents = [];
         const invocations = [];
@@ -4310,7 +4510,7 @@ export async function executeNaturalLanguageRoute(query, options) {
                 executionId: correlationId,
                 query,
                 simulationResult: simulationData,
-                platformAnalysis: agentResults.map(p => ({ domain: p.domain, agent: p.agent, status: p.status, response: p.response })),
+                platformAnalysis: agentResults.map(p => ({ domain: p.domain, agent: p.agent, status: p.status, response: p.response, execution_tier: p.execution_tier })),
                 correlationId,
                 timing: elapsed,
             });
@@ -4327,20 +4527,20 @@ export async function executeNaturalLanguageRoute(query, options) {
         const fleetDegradations = drainDegradations(correlationId);
         const fleetPhase1Verdict = computePhase1Verdict(invocations, fleetDegradations, artifactFilesFleet);
         if (artifactRunDirFleet) {
-            try {
-                const fsMod = await import('node:fs');
-                const pathMod = await import('node:path');
-                const mPath = pathMod.join(artifactRunDirFleet, 'manifest.json');
-                if (fsMod.existsSync(mPath)) {
-                    const m = JSON.parse(fsMod.readFileSync(mPath, 'utf-8'));
-                    m['phase1_verdict'] = fleetPhase1Verdict.verdict;
-                    m['phase1_reason'] = fleetPhase1Verdict.reason;
-                    m['phase1_degradations'] = fleetPhase1Verdict.degradations;
-                    m['phase1_stats'] = fleetPhase1Verdict.stats;
-                    fsMod.writeFileSync(mPath, JSON.stringify(m, null, 2), 'utf-8');
-                }
-            }
-            catch { /* non-fatal */ }
+            // ADR-PIPELINE-108 D5: record the effective dispatch bounds so a run's
+            // timing envelope is reproducible against the config in force. Written
+            // BOTH as a dedicated artifact (fleet-dispatch.json — never rewritten by
+            // later phases) and best-effort into manifest.json.
+            const fleetDispatchRecord = {
+                ...fleetCfg,
+                dispatched: dispatchAgents.length,
+                total: fleetAgents.length,
+                preflight_skipped: fleetPreflightSkipped,
+                breaker_tripped: fleetBreakerState.tripped,
+                breaker_after_n_timeouts: fleetBreakerState.after_n_timeouts,
+                elapsed_ms: elapsed,
+            };
+            persistFleetDispatch(artifactRunDirFleet, fleetDispatchRecord, fleetPhase1Verdict);
         }
         if (fleetPhase1Verdict.verdict !== 'healthy') {
             const label = fleetPhase1Verdict.verdict.toUpperCase();