npm - nemoris - Versions diffs - 0.1.0 → 0.1.2 - Mend

nemoris 0.1.0 → 0.1.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (248) hide show

package/.env.example +49 -49
package/LICENSE +21 -21
package/README.md +209 -209
package/SECURITY.md +59 -119
package/bin/nemoris +46 -46
package/config/agents/agent.toml.example +28 -28
package/config/agents/content.toml +23 -0
package/config/agents/default.toml +22 -22
package/config/agents/heartbeat.toml +35 -0
package/config/agents/iris.toml +23 -0
package/config/agents/lab.toml +23 -0
package/config/agents/main.toml +45 -0
package/config/agents/nemo.toml +21 -0
package/config/agents/ops.toml +38 -0
package/config/agents/orchestrator.toml +18 -18
package/config/agents/revenue.toml +23 -0
package/config/agents/testyboo.toml +19 -0
package/config/delivery.toml +73 -73
package/config/embeddings.toml +5 -5
package/config/identity/content-purpose.md +11 -0
package/config/identity/content-soul.md +45 -0
package/config/identity/default-purpose.md +1 -1
package/config/identity/default-soul.md +3 -3
package/config/identity/heartbeat-purpose.md +9 -0
package/config/identity/heartbeat-soul.md +16 -0
package/config/identity/iris-purpose.md +17 -0
package/config/identity/iris-soul.md +68 -0
package/config/identity/lab-purpose.md +10 -0
package/config/identity/lab-soul.md +38 -0
package/config/identity/main-purpose.md +17 -0
package/config/identity/main-soul.md +66 -0
package/config/identity/main-user.md +22 -0
package/config/identity/ops-purpose.md +9 -0
package/config/identity/ops-soul.md +16 -0
package/config/identity/orchestrator-purpose.md +1 -1
package/config/identity/orchestrator-soul.md +1 -1
package/config/identity/revenue-purpose.md +9 -0
package/config/identity/revenue-soul.md +41 -0
package/config/identity/testyboo-purpose.md +13 -0
package/config/identity/testyboo-soul.md +20 -0
package/config/improvement-targets.toml +15 -15
package/config/jobs/heartbeat-check.toml +30 -30
package/config/jobs/memory-rollup.toml +46 -46
package/config/jobs/workspace-health.toml +63 -63
package/config/mcp.toml +16 -16
package/config/output-contracts.toml +17 -17
package/config/peers.toml +32 -32
package/config/peers.toml.example +32 -32
package/config/policies/memory-default.toml +10 -10
package/config/policies/memory-heartbeat.toml +5 -5
package/config/policies/memory-ops.toml +10 -10
package/config/policies/tools-heartbeat-minimal.toml +8 -8
package/config/policies/tools-interactive-safe.toml +8 -8
package/config/policies/tools-ops-bounded.toml +8 -8
package/config/policies/tools-orchestrator.toml +7 -7
package/config/providers/anthropic.toml +15 -15
package/config/providers/ollama.toml +5 -5
package/config/providers/openai-codex.toml +9 -9
package/config/providers/openrouter.toml +5 -5
package/config/router.toml +22 -22
package/config/runtime.toml +114 -114
package/config/skills/self-improvement.toml +15 -15
package/config/skills/telegram-onboarding-spec.md +240 -240
package/config/skills/workspace-monitor.toml +15 -15
package/config/task-router.toml +42 -42
package/install.sh +50 -50
package/package.json +91 -90
package/src/auth/auth-profiles.js +169 -169
package/src/auth/openai-codex-oauth.js +285 -285
package/src/battle.js +449 -449
package/src/cli/help.js +265 -265
package/src/cli/output-filter.js +49 -49
package/src/cli/runtime-control.js +704 -704
package/src/cli-main.js +2763 -2763
package/src/cli.js +78 -78
package/src/config/loader.js +332 -332
package/src/config/schema-validator.js +214 -214
package/src/config/toml-lite.js +8 -8
package/src/daemon/action-handlers.js +71 -71
package/src/daemon/healing-tick.js +87 -87
package/src/daemon/health-probes.js +90 -90
package/src/daemon/notifier.js +57 -57
package/src/daemon/nurse.js +218 -218
package/src/daemon/repair-log.js +106 -106
package/src/daemon/rule-staging.js +90 -90
package/src/daemon/rules.js +29 -29
package/src/daemon/telegram-commands.js +54 -54
package/src/daemon/updater.js +85 -85
package/src/jobs/job-runner.js +78 -78
package/src/mcp/consumer.js +129 -129
package/src/memory/active-recall.js +171 -171
package/src/memory/backend-manager.js +97 -97
package/src/memory/backends/file-backend.js +38 -38
package/src/memory/backends/qmd-backend.js +219 -219
package/src/memory/embedding-guards.js +24 -24
package/src/memory/embedding-index.js +118 -118
package/src/memory/embedding-service.js +179 -179
package/src/memory/file-index.js +177 -177
package/src/memory/memory-signature.js +5 -5
package/src/memory/memory-store.js +648 -648
package/src/memory/retrieval-planner.js +66 -66
package/src/memory/scoring.js +145 -145
package/src/memory/simhash.js +78 -78
package/src/memory/sqlite-active-store.js +824 -824
package/src/memory/write-policy.js +36 -36
package/src/onboarding/aliases.js +33 -33
package/src/onboarding/auth/api-key.js +224 -224
package/src/onboarding/auth/ollama-detect.js +42 -42
package/src/onboarding/clack-prompter.js +77 -77
package/src/onboarding/doctor.js +530 -530
package/src/onboarding/lock.js +42 -42
package/src/onboarding/model-catalog.js +344 -344
package/src/onboarding/phases/auth.js +576 -589
package/src/onboarding/phases/build.js +130 -130
package/src/onboarding/phases/choose.js +82 -82
package/src/onboarding/phases/detect.js +98 -98
package/src/onboarding/phases/hatch.js +216 -216
package/src/onboarding/phases/identity.js +79 -79
package/src/onboarding/phases/ollama.js +345 -345
package/src/onboarding/phases/scaffold.js +99 -99
package/src/onboarding/phases/telegram.js +377 -377
package/src/onboarding/phases/validate.js +204 -204
package/src/onboarding/phases/verify.js +206 -206
package/src/onboarding/platform.js +482 -482
package/src/onboarding/status-bar.js +95 -95
package/src/onboarding/templates.js +794 -794
package/src/onboarding/toml-writer.js +38 -38
package/src/onboarding/tui.js +250 -250
package/src/onboarding/uninstall.js +153 -153
package/src/onboarding/wizard.js +516 -499
package/src/providers/anthropic.js +168 -168
package/src/providers/base.js +247 -247
package/src/providers/circuit-breaker.js +136 -136
package/src/providers/ollama.js +163 -163
package/src/providers/openai-codex.js +149 -149
package/src/providers/openrouter.js +136 -136
package/src/providers/registry.js +36 -36
package/src/providers/router.js +16 -16
package/src/runtime/bootstrap-cache.js +47 -47
package/src/runtime/capabilities-prompt.js +25 -25
package/src/runtime/completion-ping.js +99 -99
package/src/runtime/config-validator.js +121 -121
package/src/runtime/context-ledger.js +360 -360
package/src/runtime/cutover-readiness.js +42 -42
package/src/runtime/daemon.js +729 -729
package/src/runtime/delivery-ack.js +195 -195
package/src/runtime/delivery-adapters/local-file.js +41 -41
package/src/runtime/delivery-adapters/openclaw-cli.js +94 -94
package/src/runtime/delivery-adapters/openclaw-peer.js +98 -98
package/src/runtime/delivery-adapters/shadow.js +13 -13
package/src/runtime/delivery-adapters/standalone-http.js +98 -98
package/src/runtime/delivery-adapters/telegram.js +104 -104
package/src/runtime/delivery-adapters/tui.js +128 -128
package/src/runtime/delivery-manager.js +807 -807
package/src/runtime/delivery-store.js +168 -168
package/src/runtime/dependency-health.js +118 -118
package/src/runtime/envelope.js +114 -114
package/src/runtime/evaluation.js +1089 -1089
package/src/runtime/exec-approvals.js +216 -216
package/src/runtime/executor.js +500 -500
package/src/runtime/failure-ping.js +67 -67
package/src/runtime/flows.js +83 -83
package/src/runtime/guards.js +45 -45
package/src/runtime/handoff.js +51 -51
package/src/runtime/identity-cache.js +28 -28
package/src/runtime/improvement-engine.js +109 -109
package/src/runtime/improvement-harness.js +581 -581
package/src/runtime/input-sanitiser.js +72 -72
package/src/runtime/interaction-contract.js +347 -347
package/src/runtime/lane-readiness.js +226 -226
package/src/runtime/migration.js +323 -323
package/src/runtime/model-resolution.js +78 -78
package/src/runtime/network.js +64 -64
package/src/runtime/notification-store.js +97 -97
package/src/runtime/notifier.js +256 -256
package/src/runtime/orchestrator.js +53 -53
package/src/runtime/orphan-reaper.js +41 -41
package/src/runtime/output-contract-schema.js +139 -139
package/src/runtime/output-contract-validator.js +439 -439
package/src/runtime/peer-readiness.js +69 -69
package/src/runtime/peer-registry.js +133 -133
package/src/runtime/pilot-status.js +108 -108
package/src/runtime/prompt-builder.js +261 -261
package/src/runtime/provider-attempt.js +582 -582
package/src/runtime/report-fallback.js +71 -71
package/src/runtime/result-normalizer.js +183 -183
package/src/runtime/retention.js +74 -74
package/src/runtime/review.js +244 -244
package/src/runtime/route-job.js +15 -15
package/src/runtime/run-store.js +38 -38
package/src/runtime/schedule.js +88 -88
package/src/runtime/scheduler-state.js +434 -434
package/src/runtime/scheduler.js +656 -656
package/src/runtime/session-compactor.js +182 -182
package/src/runtime/session-search.js +155 -155
package/src/runtime/slack-inbound.js +249 -249
package/src/runtime/ssrf.js +102 -102
package/src/runtime/status-aggregator.js +330 -330
package/src/runtime/task-contract.js +140 -140
package/src/runtime/task-packet.js +107 -107
package/src/runtime/task-router.js +140 -140
package/src/runtime/telegram-inbound.js +1565 -1565
package/src/runtime/token-counter.js +134 -134
package/src/runtime/token-estimator.js +59 -59
package/src/runtime/tool-loop.js +200 -200
package/src/runtime/transport-server.js +311 -311
package/src/runtime/tui-server.js +411 -411
package/src/runtime/ulid.js +44 -44
package/src/security/ssrf-check.js +197 -197
package/src/setup.js +369 -369
package/src/shadow/bridge.js +303 -303
package/src/skills/loader.js +84 -84
package/src/tools/catalog.json +49 -49
package/src/tools/cli-delegate.js +44 -44
package/src/tools/mcp-client.js +106 -106
package/src/tools/micro/cancel-task.js +6 -6
package/src/tools/micro/complete-task.js +6 -6
package/src/tools/micro/fail-task.js +6 -6
package/src/tools/micro/http-fetch.js +74 -74
package/src/tools/micro/index.js +36 -36
package/src/tools/micro/lcm-recall.js +60 -60
package/src/tools/micro/list-dir.js +17 -17
package/src/tools/micro/list-skills.js +46 -46
package/src/tools/micro/load-skill.js +38 -38
package/src/tools/micro/memory-search.js +45 -45
package/src/tools/micro/read-file.js +11 -11
package/src/tools/micro/session-search.js +54 -54
package/src/tools/micro/shell-exec.js +43 -43
package/src/tools/micro/trigger-job.js +79 -79
package/src/tools/micro/web-search.js +58 -58
package/src/tools/micro/workspace-paths.js +39 -39
package/src/tools/micro/write-file.js +14 -14
package/src/tools/micro/write-memory.js +41 -41
package/src/tools/registry.js +348 -348
package/src/tools/tool-result-contract.js +36 -36
package/src/tui/chat.js +835 -835
package/src/tui/renderer.js +175 -175
package/src/tui/socket-client.js +217 -217
package/src/utils/canonical-json.js +29 -29
package/src/utils/compaction.js +30 -30
package/src/utils/env-loader.js +5 -5
package/src/utils/errors.js +80 -80
package/src/utils/fs.js +101 -101
package/src/utils/ids.js +5 -5
package/src/utils/model-context-limits.js +30 -30
package/src/utils/token-budget.js +74 -74
package/src/utils/usage-cost.js +25 -25
package/src/utils/usage-metrics.js +14 -14

package/src/runtime/provider-attempt.js CHANGED Viewed

@@ -1,582 +1,582 @@
-import { downloadTelegramFile } from "./telegram-inbound.js";
-import { ModelRouter } from "../providers/router.js";
-import { assertProviderExecutionAllowed } from "./guards.js";
-import { compileOutputContractSchema } from "./output-contract-schema.js";
-import { estimateInvocationTokens } from "./token-estimator.js";
-import { TokenCounter } from "./token-counter.js";
-import { classifyRuntimeFailure, getReportFallbackPolicy, resolveReportFallback } from "./report-fallback.js";
-import { extractUsageMetrics } from "../utils/usage-metrics.js";
-export function modelToProviderId(modelId) {
-  return String(modelId || "").split("/")[0] || null;
-}
-export function isRetryableError(err) {
-  const message = (err.message || "").toLowerCase();
-  const statusCode = err.statusCode || err.status || 0;
-  if (
-    message.includes("econnrefused") ||
-    message.includes("etimedout") ||
-    message.includes("fetch failed") ||
-    message.includes("net_error") ||
-    message.includes("timeout") ||
-    message.includes("enotfound") ||
-    message.includes("eai_again")
-  ) {
-    return true;
-  }
-  if (statusCode === 429 || (statusCode >= 500 && statusCode < 600)) {
-    return true;
-  }
-  return false;
-}
-export function computeProviderTimeoutMs(plan, providerConfig, options = {}) {
-  if (options.providerTimeoutMs != null) {
-    return Number(options.providerTimeoutMs);
-  }
-  const defaultTimeoutMs = Number(providerConfig?.defaultTimeoutMs || 0);
-  const budgetSeconds = Number(plan?.job?.budget?.maxRuntimeSeconds || 0);
-  const budgetTimeoutMs = budgetSeconds ? Math.min((budgetSeconds + 5) * 1000, 60000) : 0;
-  return Math.max(defaultTimeoutMs, budgetTimeoutMs || 0);
-}
-export function buildRoutingDecision(plan, options = {}) {
-  const routeMode = options.routeMode || plan.routing?.routeMode || "primary";
-  const selectedLane = options.laneOverride || plan.routing?.selectedLane || plan.job.modelLane;
-  return {
-    requestedLane: plan.job.modelLane,
-    selectedLane,
-    routeMode,
-    matchedRule: plan.routing?.matchedRule || null,
-    reasons: plan.routing?.reasons || [],
-    modelOverride: options.modelOverride || null
-  };
-}
-export function getLocalPromptContractOutputCap(plan, { providerId, providerCapabilities, routingDecision }) {
-  if (providerId !== "ollama") return null;
-  if (providerCapabilities?.structuredOutputMode !== "prompt_contract") return null;
-  const format = plan?.packet?.layers?.outputContract?.format || null;
-  if (format === "bulleted_briefing") return 1500;
-  if (format === "structured_rollup") return 2000;
-  if (routingDecision?.selectedLane === "local_cheap") return 400;
-  if (routingDecision?.selectedLane === "local_report") return 1200;
-  return null;
-}
-export async function prepareProviderAttempt({
-  plan,
-  runtimeConfig,
-  registry,
-  tokenCounter,
-  modelId,
-  providerConfig,
-  providerId,
-  routingDecision,
-  providerTimeoutMs,
-  toolSchemas,
-  buildSystemPrompt,
-  buildUserMessage
-}) {
-  if (!providerConfig) {
-    throw new Error(`No provider config for model ${modelId}`);
-  }
-  const adapter = registry.create(providerConfig);
-  const providerCapabilities = adapter?.getCapabilities?.() || null;
-  const nativeStructuredOutput = Boolean(
-    adapter &&
-      plan.packet.layers.outputContract &&
-      typeof adapter.supportsNativeStructuredOutput === "function" &&
-      adapter.supportsNativeStructuredOutput()
-  );
-  const responseSchema = nativeStructuredOutput
-    ? compileOutputContractSchema(plan.packet.layers.outputContract, {
-        thoughtFirst: providerCapabilities?.supportsReasoningSchema === true
-      })
-    : null;
-  const localPromptContractCap = getLocalPromptContractOutputCap(plan, {
-    providerId,
-    providerCapabilities,
-    routingDecision
-  });
-  const effectiveMaxTokens = localPromptContractCap
-    ? Math.min(Number(plan.job.budget.maxTokens || 0) || 0, localPromptContractCap)
-    : plan.job.budget.maxTokens;
-  const invocation = {
-    model: modelId,
-    system: buildSystemPrompt(plan, {
-      nativeStructuredOutput,
-      responseSchema,
-      toolSchemas
-    }),
-    messages: [
-      {
-        role: "user",
-        content: buildUserMessage(plan, {
-          nativeStructuredOutput,
-          responseSchema
-        })
-      }
-    ],
-    maxTokens: effectiveMaxTokens,
-    responseSchema,
-    timeoutMs: providerTimeoutMs,
-    tools: toolSchemas?.length ? toolSchemas : undefined,
-    options:
-      providerId === "ollama"
-        ? {
-            num_predict: effectiveMaxTokens
-          }
-        : undefined
-  };
-  const thinkMode = plan?.packet?.thinkMode;
-  if (
-    thinkMode && thinkMode !== "off" &&
-    providerId === "anthropic" &&
-    process.env.ANTHROPIC_THINKING_ENABLED === "true"
-  ) {
-    const THINK_BUDGETS = { low: 1000, medium: 8000, high: 16000 };
-    const budget = THINK_BUDGETS[thinkMode] || 8000;
-    invocation.betas = [...(invocation.betas || []), "interleaved-thinking-2025-05-14"];
-    invocation.thinking = { type: "enabled", budget_tokens: budget };
-  }
-  const preflight = await buildPreflight(runtimeConfig, invocation, {
-    providerId,
-    adapter,
-    tokenCounter
-  });
-  if (preflight.pressure === "hard") {
-    throw new Error(
-      `Preflight blocked ${plan.job.id}: estimated prompt tokens ${preflight.estimatedPromptTokens} exceed hard limit ${preflight.hardLimit}`
-    );
-  }
-  return {
-    adapter,
-    providerCapabilities,
-    invocation,
-    preflight
-  };
-}
-export async function buildPreflight(runtimeConfig, invocation, options = {}) {
-  const contextTokens = runtimeConfig?.safety?.contextTokens ?? 32768;
-  const softRatio = runtimeConfig?.safety?.contextPressureSoftRatio ?? 0.72;
-  const hardRatio = runtimeConfig?.safety?.contextPressureHardRatio ?? 0.9;
-  const freshSessionOnHighPressure = runtimeConfig?.safety?.freshSessionOnHighPressure ?? true;
-  const snapshotBeforeCompaction = runtimeConfig?.safety?.snapshotBeforeCompaction ?? true;
-  const tokenCounter = options.tokenCounter || new TokenCounter();
-  const tokenEstimate = await tokenCounter.countInvocation({
-    providerId: options.providerId,
-    invocation,
-    adapter: options.adapter
-  });
-  const heuristicEstimate = tokenEstimate.mode === "heuristic" ? tokenEstimate.details : estimateInvocationTokens(invocation);
-  const estimatedPromptTokens = tokenEstimate.total;
-  const softLimit = Math.floor(contextTokens * softRatio);
-  const hardLimit = Math.floor(contextTokens * hardRatio);
-  let pressure = "low";
-  if (estimatedPromptTokens >= hardLimit) pressure = "hard";
-  else if (estimatedPromptTokens >= softLimit) pressure = "high";
-  return {
-    contextTokens,
-    estimatedPromptTokens,
-    tokenEstimate,
-    heuristicEstimate,
-    softLimit,
-    hardLimit,
-    pressure,
-    freshSessionRequired: pressure !== "low" && freshSessionOnHighPressure,
-    snapshotBeforeCompaction
-  };
-}
-async function attachVisionInputs(plan, runtimeConfig, invocation, providerCapabilities) {
-  if (!plan.packet?.imageRefs?.length || !invocation) {
-    return invocation;
-  }
-  if (providerCapabilities?.supportsVision) {
-    const tgConfig = runtimeConfig?.telegram;
-    const botToken = tgConfig?.botTokenEnv ? process.env[tgConfig.botTokenEnv] : null;
-    if (!botToken) {
-      console.warn(`[executor] imageRefs present but botToken not resolved from ${tgConfig?.botTokenEnv || "undefined env key"}`);
-      return invocation;
-    }
-    const imageBlocks = [];
-    for (const ref of plan.packet.imageRefs) {
-      const downloaded = await downloadTelegramFile(ref.fileId, botToken);
-      if (downloaded) {
-        imageBlocks.push({
-          type: "image",
-          source: {
-            type: "base64",
-            media_type: downloaded.mediaType,
-            data: downloaded.base64,
-          },
-        });
-      }
-    }
-    if (imageBlocks.length > 0) {
-      const userIdx = invocation.messages.findLastIndex((message) => message.role === "user");
-      if (userIdx !== -1) {
-        const textContent = invocation.messages[userIdx].content;
-        invocation.messages[userIdx].content = [
-          ...imageBlocks,
-          { type: "text", text: textContent },
-        ];
-      }
-    }
-    return invocation;
-  }
-  const visionNote = "[Image received but this model doesn't support vision]";
-  const userIdx = invocation.messages.findLastIndex((message) => message.role === "user");
-  if (userIdx !== -1) {
-    const existing = invocation.messages[userIdx].content;
-    invocation.messages[userIdx].content = existing
-      ? `${existing}\n\n${visionNote}`
-      : visionNote;
-  }
-  return invocation;
-}
-function annotateAttemptError(error, metadata = {}) {
-  if (!error || typeof error !== "object") {
-    return error;
-  }
-  Object.assign(error, metadata);
-  return error;
-}
-async function executeProviderCall({
-  plan,
-  runtime,
-  mode,
-  registry,
-  tokenCounter,
-  modelId,
-  providerId,
-  providerConfig,
-  routingDecision,
-  providerTimeoutMs,
-  toolSchemas,
-  buildSystemPrompt,
-  buildUserMessage,
-  onPrepared
-}) {
-  let prepared = null;
-  let invocation = null;
-  try {
-    prepared = await prepareProviderAttempt({
-      plan,
-      runtimeConfig: runtime.runtime,
-      registry,
-      tokenCounter,
-      modelId,
-      providerConfig,
-      providerId,
-      routingDecision,
-      providerTimeoutMs,
-      toolSchemas,
-      buildSystemPrompt,
-      buildUserMessage
-    });
-    if (typeof onPrepared === "function") {
-      onPrepared(prepared);
-    }
-    invocation = await attachVisionInputs(
-      plan,
-      runtime.runtime,
-      prepared.invocation,
-      prepared.providerCapabilities
-    );
-    if (mode === "dry-run") {
-      return {
-        response: null,
-        providerId,
-        modelId,
-        usage: {
-          tokensIn: 0,
-          tokensOut: 0,
-          cacheIn: 0,
-          cacheCreation: 0,
-        },
-        cached: false,
-        adapter: prepared.adapter,
-        providerCapabilities: prepared.providerCapabilities,
-        invocation,
-        preflight: prepared.preflight,
-        providerModePolicy: null,
-        health: null,
-        toolLoopEnabled: false
-      };
-    }
-    const providerModePolicy = assertProviderExecutionAllowed({
-      jobId: plan.job.id,
-      modelLane: routingDecision.selectedLane,
-      providerId,
-      interactive: plan.job.trigger === "interactive"
-    });
-    let health = null;
-    if (providerModePolicy.requireHealthyProvider) {
-      const healthCheck = await prepared.adapter.healthCheck();
-      if (!healthCheck.ok) {
-        throw new Error(`Provider health check failed for ${providerId} with status ${healthCheck.status}`);
-      }
-      health = healthCheck;
-    }
-    const response = await prepared.adapter.invoke(invocation);
-    const usage = extractUsageMetrics(response);
-    return {
-      response,
-      providerId,
-      modelId,
-      usage,
-      cached: Boolean(usage.cacheIn || usage.cacheCreation),
-      adapter: prepared.adapter,
-      providerCapabilities: prepared.providerCapabilities,
-      invocation,
-      preflight: prepared.preflight,
-      providerModePolicy,
-      health,
-      toolLoopEnabled: true
-    };
-  } catch (error) {
-    throw annotateAttemptError(error, {
-      providerId,
-      modelId,
-      routingDecision,
-      providerCapabilities: prepared?.providerCapabilities || null,
-      invocation: invocation || prepared?.invocation || null,
-      preflight: prepared?.preflight || null
-    });
-  }
-}
-function buildFallbackState(runtimeConfig, routingDecision, providerId, modelId, options) {
-  return {
-    allowed: false,
-    attempted: false,
-    trigger: null,
-    finalSourceLane: routingDecision.selectedLane,
-    sourceLane: routingDecision.selectedLane,
-    sourceProviderId: providerId,
-    sourceModelId: modelId,
-    policy: getReportFallbackPolicy(runtimeConfig, options)
-  };
-}
-export async function attemptProvider({ plan, runtime, options = {} }) {
-  const mode = options.mode || "dry-run";
-  const router = options.router || new ModelRouter(runtime.router);
-  const routingDecision = buildRoutingDecision(plan, options);
-  const laneConfig = runtime.router?.[routingDecision.selectedLane];
-  const primaryModelId = options.modelOverride || plan.packet.modelOverride || router.resolve(routingDecision.selectedLane, routingDecision.routeMode);
-  const providersToTry = [primaryModelId, ...(laneConfig?.fallbackModels || [])];
-  const toolSchemas = options.toolSchemas || [];
-  const registry = options.registry;
-  const tokenCounter = options.tokenCounter;
-  const buildSystemPrompt = options.buildSystemPrompt;
-  const buildUserMessage = options.buildUserMessage;
-  let fallback = null;
-  let primaryError = null;
-  let lastProviderId = null;
-  for (const currentModelId of providersToTry) {
-    const currentProviderId = modelToProviderId(currentModelId);
-    const providerConfig = runtime.providers[currentProviderId];
-    const providerTimeoutMs = computeProviderTimeoutMs(plan, providerConfig, options);
-    const breaker = options.getBreaker?.(currentModelId, runtime.runtime) || null;
-    lastProviderId = currentProviderId;
-    if (breaker?.isOpen()) {
-      const retryAfter = breaker.retryAfter();
-      console.warn(`[Nemoris] circuit breaker open for ${currentModelId}, skipping (retry in ${Math.ceil(retryAfter)}s)`);
-      primaryError = new Error(`Provider ${currentModelId} circuit open — retry after ${Math.ceil(retryAfter)}s`);
-      annotateAttemptError(primaryError, {
-        providerId: currentProviderId,
-        modelId: currentModelId,
-        routingDecision,
-        fallback
-      });
-      continue;
-    }
-    try {
-      const attempt = await executeProviderCall({
-        plan,
-        runtime,
-        mode,
-        registry,
-        tokenCounter,
-        modelId: currentModelId,
-        providerId: currentProviderId,
-        providerConfig,
-        routingDecision,
-        providerTimeoutMs,
-        toolSchemas,
-        buildSystemPrompt,
-        buildUserMessage,
-        onPrepared: () => {
-          if (!fallback) {
-            fallback = buildFallbackState(runtime.runtime, routingDecision, currentProviderId, currentModelId, options);
-          }
-        }
-      });
-      if (mode === "provider") {
-        breaker?.recordSuccess();
-      }
-      return {
-        ...attempt,
-        routingDecision,
-        fallback,
-        primaryModelId
-      };
-    } catch (err) {
-      primaryError = annotateAttemptError(err, {
-        providerId: currentProviderId,
-        modelId: currentModelId,
-        routingDecision,
-        fallback
-      });
-      const statusCode = err.statusCode || err.status || 0;
-      breaker?.recordFailure(statusCode);
-      if (isRetryableError(err)) {
-        console.warn(`[executor] provider ${currentModelId} failed: ${err.message}, trying next`);
-        continue;
-      }
-      break;
-    }
-  }
-  if (!primaryError) {
-    primaryError = new Error("All providers in failover chain exhausted");
-    annotateAttemptError(primaryError, {
-      routingDecision,
-      fallback
-    });
-  }
-  const failureClass = classifyRuntimeFailure(primaryError?.message || "");
-  const fallbackResolution = resolveReportFallback({
-    runtimeConfig: runtime.runtime,
-    job: plan.job,
-    routingDecision,
-    providerId: lastProviderId,
-    failureClass,
-    options
-  });
-  fallback = {
-    ...(fallback || {}),
-    allowed: fallbackResolution.allowed,
-    attempted: false,
-    trigger: failureClass,
-    localFailureClass: failureClass,
-    localError: primaryError.message,
-    blockedReason: fallbackResolution.allowed ? null : fallbackResolution.reason,
-    targetLane: fallbackResolution.targetLane || null
-  };
-  if (!fallbackResolution.allowed) {
-    annotateAttemptError(primaryError, {
-      providerId: primaryError.providerId || lastProviderId,
-      routingDecision,
-      fallback
-    });
-    throw primaryError;
-  }
-  fallback.attempted = true;
-  const fallbackRoutingDecision = {
-    ...routingDecision,
-    selectedLane: fallbackResolution.targetLane,
-    routeMode: "fallback",
-    reasons: [...(routingDecision.reasons || []), `fallback:${failureClass}`],
-    description: "Failure-triggered report fallback."
-  };
-  const fallbackModelId = router.resolve(fallbackResolution.targetLane, "primary");
-  const fallbackProviderId = modelToProviderId(fallbackModelId);
-  const fallbackProviderConfig = runtime.providers[fallbackProviderId];
-  try {
-    const attempt = await executeProviderCall({
-      plan,
-      runtime,
-      mode,
-      registry,
-      tokenCounter,
-      modelId: fallbackModelId,
-      providerId: fallbackProviderId,
-      providerConfig: fallbackProviderConfig,
-      routingDecision: fallbackRoutingDecision,
-      providerTimeoutMs: computeProviderTimeoutMs(plan, fallbackProviderConfig, options),
-      toolSchemas,
-      buildSystemPrompt,
-      buildUserMessage
-    });
-    return {
-      ...attempt,
-      routingDecision: fallbackRoutingDecision,
-      fallback: {
-        ...fallback,
-        success: true,
-        finalSourceLane: fallbackRoutingDecision.selectedLane,
-        finalProviderId: fallbackProviderId,
-        finalModelId: fallbackModelId
-      },
-      toolLoopEnabled: mode === "provider" && Boolean(options.allowToolLoopOnFallback)
-    };
-  } catch (fallbackError) {
-    fallback = {
-      ...fallback,
-      success: false,
-      fallbackFailureClass: classifyRuntimeFailure(fallbackError?.message || ""),
-      fallbackError: fallbackError.message
-    };
-    const combinedError = new Error(
-      `Primary provider failed (${failureClass}) and fallback failed: ${fallbackError.message}`
-    );
-    annotateAttemptError(combinedError, {
-      providerId: fallbackProviderId,
-      modelId: fallbackModelId,
-      routingDecision: fallbackRoutingDecision,
-      providerCapabilities: fallbackError?.providerCapabilities || null,
-      invocation: fallbackError?.invocation || null,
-      preflight: fallbackError?.preflight || null,
-      fallback
-    });
-    throw combinedError;
-  }
-}
+import { downloadTelegramFile } from "./telegram-inbound.js";
+import { ModelRouter } from "../providers/router.js";
+import { assertProviderExecutionAllowed } from "./guards.js";
+import { compileOutputContractSchema } from "./output-contract-schema.js";
+import { estimateInvocationTokens } from "./token-estimator.js";
+import { TokenCounter } from "./token-counter.js";
+import { classifyRuntimeFailure, getReportFallbackPolicy, resolveReportFallback } from "./report-fallback.js";
+import { extractUsageMetrics } from "../utils/usage-metrics.js";
+export function modelToProviderId(modelId) {
+  return String(modelId || "").split("/")[0] || null;
+}
+export function isRetryableError(err) {
+  const message = (err.message || "").toLowerCase();
+  const statusCode = err.statusCode || err.status || 0;
+  if (
+    message.includes("econnrefused") ||
+    message.includes("etimedout") ||
+    message.includes("fetch failed") ||
+    message.includes("net_error") ||
+    message.includes("timeout") ||
+    message.includes("enotfound") ||
+    message.includes("eai_again")
+  ) {
+    return true;
+  }
+  if (statusCode === 429 || (statusCode >= 500 && statusCode < 600)) {
+    return true;
+  }
+  return false;
+}
+export function computeProviderTimeoutMs(plan, providerConfig, options = {}) {
+  if (options.providerTimeoutMs != null) {
+    return Number(options.providerTimeoutMs);
+  }
+  const defaultTimeoutMs = Number(providerConfig?.defaultTimeoutMs || 0);
+  const budgetSeconds = Number(plan?.job?.budget?.maxRuntimeSeconds || 0);
+  const budgetTimeoutMs = budgetSeconds ? Math.min((budgetSeconds + 5) * 1000, 60000) : 0;
+  return Math.max(defaultTimeoutMs, budgetTimeoutMs || 0);
+}
+/**
+ * Assemble the routing decision record for a plan.
+ *
+ * Lane precedence: `options.laneOverride`, then `plan.routing.selectedLane`,
+ * then the job's own `modelLane`. Route mode precedence: `options.routeMode`,
+ * then `plan.routing.routeMode`, then "primary".
+ *
+ * @param {object} plan - Must carry `job.modelLane`; `routing` is optional.
+ * @param {object} [options] - May carry `routeMode`, `laneOverride`, `modelOverride`.
+ * @returns {{requestedLane: *, selectedLane: *, routeMode: *, matchedRule: *, reasons: Array, modelOverride: *}}
+ */
+export function buildRoutingDecision(plan, options = {}) {
+  const { routing, job } = plan;
+  const requestedLane = job.modelLane;
+
+  return {
+    requestedLane,
+    selectedLane: options.laneOverride || routing?.selectedLane || requestedLane,
+    routeMode: options.routeMode || routing?.routeMode || "primary",
+    matchedRule: routing?.matchedRule || null,
+    reasons: routing?.reasons || [],
+    modelOverride: options.modelOverride || null
+  };
+}
+/**
+ * Look up the output-token cap for local prompt-contract runs.
+ *
+ * A cap only applies when the provider is "ollama" and its capabilities report
+ * `structuredOutputMode === "prompt_contract"`. The output contract format is
+ * checked first, then the selected lane.
+ *
+ * @param {object} [plan] - Plan whose `packet.layers.outputContract.format` is read.
+ * @param {object} context
+ * @param {string} context.providerId
+ * @param {object} [context.providerCapabilities]
+ * @param {object} [context.routingDecision]
+ * @returns {number|null} The cap, or null when no cap applies.
+ */
+export function getLocalPromptContractOutputCap(plan, { providerId, providerCapabilities, routingDecision }) {
+  const isLocalPromptContract =
+    providerId === "ollama" && providerCapabilities?.structuredOutputMode === "prompt_contract";
+  if (!isLocalPromptContract) {
+    return null;
+  }
+
+  // Contract format takes priority over the lane.
+  const format = plan?.packet?.layers?.outputContract?.format || null;
+  switch (format) {
+    case "bulleted_briefing":
+      return 1500;
+    case "structured_rollup":
+      return 2000;
+    default:
+      break;
+  }
+
+  switch (routingDecision?.selectedLane) {
+    case "local_cheap":
+      return 400;
+    case "local_report":
+      return 1200;
+    default:
+      return null;
+  }
+}
+/**
+ * Build everything needed for a single provider attempt: the adapter, its
+ * reported capabilities, the invocation payload and the preflight token check.
+ *
+ * @param {object} args
+ * @param {object} args.plan - Execution plan; `plan.job.budget` and `plan.packet.layers` are read.
+ * @param {object} args.runtimeConfig - Runtime config forwarded to `buildPreflight`.
+ * @param {object} args.registry - Provider registry; `registry.create(providerConfig)` yields the adapter.
+ * @param {object} [args.tokenCounter] - Token counter forwarded to `buildPreflight`.
+ * @param {string} args.modelId - Model id placed on the invocation.
+ * @param {object} args.providerConfig - Provider config; required.
+ * @param {string} args.providerId - Provider id ("ollama" and "anthropic" get special handling).
+ * @param {object} args.routingDecision - Routing decision used for the local output cap.
+ * @param {number} args.providerTimeoutMs - Timeout placed on the invocation.
+ * @param {Array} [args.toolSchemas] - Tool schemas; only attached when non-empty.
+ * @param {Function} args.buildSystemPrompt - `(plan, ctx) => system prompt`.
+ * @param {Function} args.buildUserMessage - `(plan, ctx) => user message content`.
+ * @returns {Promise<{adapter: object, providerCapabilities: object|null, invocation: object, preflight: object}>}
+ * @throws {Error} When `providerConfig` is missing, or when preflight reports "hard" pressure.
+ */
+export async function prepareProviderAttempt({
+  plan,
+  runtimeConfig,
+  registry,
+  tokenCounter,
+  modelId,
+  providerConfig,
+  providerId,
+  routingDecision,
+  providerTimeoutMs,
+  toolSchemas,
+  buildSystemPrompt,
+  buildUserMessage
+}) {
+  if (!providerConfig) {
+    throw new Error(`No provider config for model ${modelId}`);
+  }
+  const adapter = registry.create(providerConfig);
+  const providerCapabilities = adapter?.getCapabilities?.() || null;
+  // Native structured output needs both an output contract and an adapter that opts in.
+  const nativeStructuredOutput = Boolean(
+    adapter &&
+      plan.packet.layers.outputContract &&
+      typeof adapter.supportsNativeStructuredOutput === "function" &&
+      adapter.supportsNativeStructuredOutput()
+  );
+  const responseSchema = nativeStructuredOutput
+    ? compileOutputContractSchema(plan.packet.layers.outputContract, {
+        thoughtFirst: providerCapabilities?.supportsReasoningSchema === true
+      })
+    : null;
+  const localPromptContractCap = getLocalPromptContractOutputCap(plan, {
+    providerId,
+    providerCapabilities,
+    routingDecision
+  });
+  // When a local cap applies, clamp the budget to it. If the budget is missing
+  // or non-positive, use the cap itself: Math.min(0, cap) would otherwise send
+  // maxTokens / num_predict = 0 to the provider.
+  const budgetMaxTokens = Number(plan.job.budget.maxTokens || 0) || 0;
+  let effectiveMaxTokens = plan.job.budget.maxTokens;
+  if (localPromptContractCap) {
+    effectiveMaxTokens =
+      budgetMaxTokens > 0 ? Math.min(budgetMaxTokens, localPromptContractCap) : localPromptContractCap;
+  }
+  const invocation = {
+    model: modelId,
+    system: buildSystemPrompt(plan, {
+      nativeStructuredOutput,
+      responseSchema,
+      toolSchemas
+    }),
+    messages: [
+      {
+        role: "user",
+        content: buildUserMessage(plan, {
+          nativeStructuredOutput,
+          responseSchema
+        })
+      }
+    ],
+    maxTokens: effectiveMaxTokens,
+    responseSchema,
+    timeoutMs: providerTimeoutMs,
+    tools: toolSchemas?.length ? toolSchemas : undefined,
+    // Ollama takes its output limit through `options.num_predict`.
+    options:
+      providerId === "ollama"
+        ? {
+            num_predict: effectiveMaxTokens
+          }
+        : undefined
+  };
+  // Extended thinking is opt-in: Anthropic only, a think mode other than "off",
+  // and the ANTHROPIC_THINKING_ENABLED env flag set to "true".
+  const thinkMode = plan?.packet?.thinkMode;
+  if (
+    thinkMode && thinkMode !== "off" &&
+    providerId === "anthropic" &&
+    process.env.ANTHROPIC_THINKING_ENABLED === "true"
+  ) {
+    const THINK_BUDGETS = { low: 1000, medium: 8000, high: 16000 };
+    // Unknown think modes fall back to the medium budget.
+    const budget = THINK_BUDGETS[thinkMode] || 8000;
+    invocation.betas = [...(invocation.betas || []), "interleaved-thinking-2025-05-14"];
+    invocation.thinking = { type: "enabled", budget_tokens: budget };
+  }
+  const preflight = await buildPreflight(runtimeConfig, invocation, {
+    providerId,
+    adapter,
+    tokenCounter
+  });
+  // Refuse to send prompts that already exceed the hard context limit.
+  if (preflight.pressure === "hard") {
+    throw new Error(
+      `Preflight blocked ${plan.job.id}: estimated prompt tokens ${preflight.estimatedPromptTokens} exceed hard limit ${preflight.hardLimit}`
+    );
+  }
+  return {
+    adapter,
+    providerCapabilities,
+    invocation,
+    preflight
+  };
+}
+/**
+ * Estimate prompt size for an invocation and classify context pressure.
+ *
+ * Limits come from `runtimeConfig.safety` with defaults of 32768 context
+ * tokens, a 0.72 soft ratio and a 0.9 hard ratio. Pressure is "hard" at or
+ * above the hard limit, "high" at or above the soft limit, otherwise "low".
+ *
+ * @param {object} [runtimeConfig] - Runtime config; only `safety` is read.
+ * @param {object} invocation - Invocation payload to count.
+ * @param {object} [options] - May carry `tokenCounter`, `providerId`, `adapter`.
+ * @returns {Promise<object>} Preflight summary (limits, estimates, pressure, session flags).
+ */
+export async function buildPreflight(runtimeConfig, invocation, options = {}) {
+  const safety = runtimeConfig?.safety;
+  const contextTokens = safety?.contextTokens ?? 32768;
+  const softRatio = safety?.contextPressureSoftRatio ?? 0.72;
+  const hardRatio = safety?.contextPressureHardRatio ?? 0.9;
+  const freshSessionOnHighPressure = safety?.freshSessionOnHighPressure ?? true;
+  const snapshotBeforeCompaction = safety?.snapshotBeforeCompaction ?? true;
+
+  const counter = options.tokenCounter || new TokenCounter();
+  const tokenEstimate = await counter.countInvocation({
+    providerId: options.providerId,
+    invocation,
+    adapter: options.adapter
+  });
+
+  // Reuse the counter's details when it already ran heuristically; otherwise compute one.
+  let heuristicEstimate;
+  if (tokenEstimate.mode === "heuristic") {
+    heuristicEstimate = tokenEstimate.details;
+  } else {
+    heuristicEstimate = estimateInvocationTokens(invocation);
+  }
+
+  const estimatedPromptTokens = tokenEstimate.total;
+  const softLimit = Math.floor(contextTokens * softRatio);
+  const hardLimit = Math.floor(contextTokens * hardRatio);
+
+  const pressure =
+    estimatedPromptTokens >= hardLimit
+      ? "hard"
+      : estimatedPromptTokens >= softLimit
+        ? "high"
+        : "low";
+
+  return {
+    contextTokens,
+    estimatedPromptTokens,
+    tokenEstimate,
+    heuristicEstimate,
+    softLimit,
+    hardLimit,
+    pressure,
+    freshSessionRequired: pressure !== "low" && freshSessionOnHighPressure,
+    snapshotBeforeCompaction
+  };
+}
+/**
+ * Attach the plan's image references to the last user message of an invocation.
+ *
+ * - No image refs or no invocation: the invocation is returned untouched.
+ * - Provider without vision support: a textual note is appended to the last
+ *   user message instead.
+ * - Provider with vision support: each image is downloaded via
+ *   `downloadTelegramFile` (one at a time, in order) and the user message
+ *   content becomes `[...imageBlocks, { type: "text", text }]`. If the bot
+ *   token cannot be resolved from the configured env key, a warning is logged
+ *   and the invocation is returned untouched.
+ *
+ * The invocation is mutated in place and also returned.
+ *
+ * @param {object} plan - Plan whose `packet.imageRefs` is read.
+ * @param {object} [runtimeConfig] - Runtime config; `telegram.botTokenEnv` names the env var.
+ * @param {object} [invocation] - Invocation whose `messages` may be rewritten.
+ * @param {object} [providerCapabilities] - Capabilities; `supportsVision` is read.
+ * @returns {Promise<object>} The same invocation object.
+ */
+async function attachVisionInputs(plan, runtimeConfig, invocation, providerCapabilities) {
+  const imageRefs = plan.packet?.imageRefs;
+  if (!imageRefs?.length || !invocation) {
+    return invocation;
+  }
+
+  const findLastUserIndex = () =>
+    invocation.messages.findLastIndex((message) => message.role === "user");
+
+  // Non-vision providers only get a note telling the model an image was dropped.
+  if (!providerCapabilities?.supportsVision) {
+    const visionNote = "[Image received but this model doesn't support vision]";
+    const noteIdx = findLastUserIndex();
+    if (noteIdx !== -1) {
+      const target = invocation.messages[noteIdx];
+      const existing = target.content;
+      target.content = existing ? `${existing}\n\n${visionNote}` : visionNote;
+    }
+    return invocation;
+  }
+
+  const tgConfig = runtimeConfig?.telegram;
+  const botToken = tgConfig?.botTokenEnv ? process.env[tgConfig.botTokenEnv] : null;
+  if (!botToken) {
+    console.warn(`[executor] imageRefs present but botToken not resolved from ${tgConfig?.botTokenEnv || "undefined env key"}`);
+    return invocation;
+  }
+
+  // Download sequentially so block order matches the order of the refs.
+  const imageBlocks = [];
+  for (const { fileId } of imageRefs) {
+    const downloaded = await downloadTelegramFile(fileId, botToken);
+    if (!downloaded) {
+      continue;
+    }
+    imageBlocks.push({
+      type: "image",
+      source: {
+        type: "base64",
+        media_type: downloaded.mediaType,
+        data: downloaded.base64
+      }
+    });
+  }
+
+  if (imageBlocks.length === 0) {
+    return invocation;
+  }
+
+  const userIdx = findLastUserIndex();
+  if (userIdx !== -1) {
+    const target = invocation.messages[userIdx];
+    target.content = [...imageBlocks, { type: "text", text: target.content }];
+  }
+  return invocation;
+}
+/**
+ * Copy attempt metadata onto an error so callers can inspect it after the throw.
+ *
+ * Only non-null values of type "object" are annotated; anything else (strings,
+ * null, undefined, ...) is returned unchanged.
+ *
+ * @param {*} error - The value being thrown.
+ * @param {object} [metadata] - Properties to assign onto the error.
+ * @returns {*} The same `error` value that was passed in.
+ */
+function annotateAttemptError(error, metadata = {}) {
+  const canAnnotate = Boolean(error) && typeof error === "object";
+  if (canAnnotate) {
+    Object.assign(error, metadata);
+  }
+  return error;
+}
+/**
+ * Run one provider attempt end to end: prepare the invocation, attach vision
+ * inputs, then either return a dry-run result or enforce the provider policy,
+ * optionally health-check, and invoke the adapter.
+ *
+ * @param {object} args
+ * @param {object} args.plan - Execution plan (`plan.job.id` and `plan.job.trigger` are read here).
+ * @param {object} args.runtime - Runtime bundle; `runtime.runtime` is passed on as the runtime config.
+ * @param {string} args.mode - "dry-run" skips the policy check, health check and adapter call.
+ * @param {object} args.registry - Provider registry forwarded to `prepareProviderAttempt`.
+ * @param {object} [args.tokenCounter] - Token counter forwarded to `prepareProviderAttempt`.
+ * @param {string} args.modelId - Model to invoke.
+ * @param {string} args.providerId - Provider owning the model.
+ * @param {object} args.providerConfig - Provider configuration.
+ * @param {object} args.routingDecision - Routing decision; `selectedLane` feeds the policy check.
+ * @param {number} args.providerTimeoutMs - Timeout forwarded to the invocation.
+ * @param {Array} [args.toolSchemas] - Tool schemas forwarded to `prepareProviderAttempt`.
+ * @param {Function} args.buildSystemPrompt - System prompt builder.
+ * @param {Function} args.buildUserMessage - User message builder.
+ * @param {Function} [args.onPrepared] - Called with the prepared attempt before vision inputs are attached.
+ * @returns {Promise<object>} Attempt result (response, usage, adapter, invocation, preflight, policy, health).
+ * @throws {*} Any failure is rethrown after being annotated with provider, model,
+ *   routing and whatever invocation/preflight data was available at that point.
+ */
+async function executeProviderCall({
+  plan,
+  runtime,
+  mode,
+  registry,
+  tokenCounter,
+  modelId,
+  providerId,
+  providerConfig,
+  routingDecision,
+  providerTimeoutMs,
+  toolSchemas,
+  buildSystemPrompt,
+  buildUserMessage,
+  onPrepared
+}) {
+  // Declared outside the try so the catch block can attach partial state to the error.
+  let prepared = null;
+  let invocation = null;
+  try {
+    prepared = await prepareProviderAttempt({
+      plan,
+      runtimeConfig: runtime.runtime,
+      registry,
+      tokenCounter,
+      modelId,
+      providerConfig,
+      providerId,
+      routingDecision,
+      providerTimeoutMs,
+      toolSchemas,
+      buildSystemPrompt,
+      buildUserMessage
+    });
+    if (typeof onPrepared === "function") {
+      onPrepared(prepared);
+    }
+    // Vision inputs are attached before the dry-run exit, so dry-run results
+    // carry the final invocation.
+    invocation = await attachVisionInputs(
+      plan,
+      runtime.runtime,
+      prepared.invocation,
+      prepared.providerCapabilities
+    );
+    if (mode === "dry-run") {
+      // Dry-run: report what would be sent, with zeroed usage and no provider contact.
+      return {
+        response: null,
+        providerId,
+        modelId,
+        usage: {
+          tokensIn: 0,
+          tokensOut: 0,
+          cacheIn: 0,
+          cacheCreation: 0,
+        },
+        cached: false,
+        adapter: prepared.adapter,
+        providerCapabilities: prepared.providerCapabilities,
+        invocation,
+        preflight: prepared.preflight,
+        providerModePolicy: null,
+        health: null,
+        toolLoopEnabled: false
+      };
+    }
+    // NOTE(review): presumably throws when execution is not permitted for this
+    // job/lane/provider combination — confirm against ./guards.js.
+    const providerModePolicy = assertProviderExecutionAllowed({
+      jobId: plan.job.id,
+      modelLane: routingDecision.selectedLane,
+      providerId,
+      interactive: plan.job.trigger === "interactive"
+    });
+    let health = null;
+    // Health is only checked when the policy asks for a healthy provider.
+    if (providerModePolicy.requireHealthyProvider) {
+      const healthCheck = await prepared.adapter.healthCheck();
+      if (!healthCheck.ok) {
+        throw new Error(`Provider health check failed for ${providerId} with status ${healthCheck.status}`);
+      }
+      health = healthCheck;
+    }
+    const response = await prepared.adapter.invoke(invocation);
+    const usage = extractUsageMetrics(response);
+    return {
+      response,
+      providerId,
+      modelId,
+      usage,
+      // Any cache read or cache creation marks the call as cached.
+      cached: Boolean(usage.cacheIn || usage.cacheCreation),
+      adapter: prepared.adapter,
+      providerCapabilities: prepared.providerCapabilities,
+      invocation,
+      preflight: prepared.preflight,
+      providerModePolicy,
+      health,
+      toolLoopEnabled: true
+    };
+  } catch (error) {
+    // Prefer the vision-augmented invocation when the failure happened after it was built.
+    throw annotateAttemptError(error, {
+      providerId,
+      modelId,
+      routingDecision,
+      providerCapabilities: prepared?.providerCapabilities || null,
+      invocation: invocation || prepared?.invocation || null,
+      preflight: prepared?.preflight || null
+    });
+  }
+}
+/**
+ * Create the initial fallback bookkeeping record for an attempt.
+ *
+ * The record starts as "not allowed / not attempted" and remembers which lane,
+ * provider and model the attempt started from, together with the report
+ * fallback policy returned by `getReportFallbackPolicy`.
+ *
+ * @param {object} runtimeConfig - Runtime config passed to `getReportFallbackPolicy`.
+ * @param {object} routingDecision - Routing decision; `selectedLane` is recorded.
+ * @param {string} providerId - Source provider id.
+ * @param {string} modelId - Source model id.
+ * @param {object} options - Options passed to `getReportFallbackPolicy`.
+ * @returns {object} Initial fallback state.
+ */
+function buildFallbackState(runtimeConfig, routingDecision, providerId, modelId, options) {
+  const { selectedLane } = routingDecision;
+  const policy = getReportFallbackPolicy(runtimeConfig, options);
+
+  return {
+    allowed: false,
+    attempted: false,
+    trigger: null,
+    finalSourceLane: selectedLane,
+    sourceLane: selectedLane,
+    sourceProviderId: providerId,
+    sourceModelId: modelId,
+    policy
+  };
+}
+/**
+ * Execute a plan against the model failover chain, then (if permitted) against
+ * the report fallback lane.
+ *
+ * Flow:
+ *  1. Resolve the primary model (option override, packet override, or router)
+ *     and append the lane's `fallbackModels`.
+ *  2. Try each model in order. Models whose circuit breaker is open are
+ *     skipped. A retryable failure moves on to the next model; any other
+ *     failure stops the chain.
+ *  3. If every attempt failed, classify the last failure and ask
+ *     `resolveReportFallback` whether a fallback lane may be used. If not, the
+ *     last error is rethrown with fallback details attached.
+ *  4. Otherwise run one attempt on the fallback lane. If that also fails, a
+ *     combined error is thrown whose `cause` is the fallback failure.
+ *
+ * @param {object} args
+ * @param {object} args.plan - Execution plan.
+ * @param {object} args.runtime - Runtime bundle (`router`, `providers`, `runtime`).
+ * @param {object} [args.options] - `mode` (defaults to "dry-run"), `router`,
+ *   `registry`, `tokenCounter`, `toolSchemas`, `buildSystemPrompt`,
+ *   `buildUserMessage`, `getBreaker`, `modelOverride`, `allowToolLoopOnFallback`, ...
+ * @returns {Promise<object>} The successful attempt plus `routingDecision` and
+ *   `fallback` (and `primaryModelId` when the failover chain itself succeeded).
+ * @throws {Error} The last chain error when fallback is not allowed, or a
+ *   combined error when the fallback attempt fails too.
+ */
+export async function attemptProvider({ plan, runtime, options = {} }) {
+  const mode = options.mode || "dry-run";
+  const router = options.router || new ModelRouter(runtime.router);
+  const routingDecision = buildRoutingDecision(plan, options);
+  const laneConfig = runtime.router?.[routingDecision.selectedLane];
+  const primaryModelId = options.modelOverride || plan.packet.modelOverride || router.resolve(routingDecision.selectedLane, routingDecision.routeMode);
+  const providersToTry = [primaryModelId, ...(laneConfig?.fallbackModels || [])];
+  const toolSchemas = options.toolSchemas || [];
+  const registry = options.registry;
+  const tokenCounter = options.tokenCounter;
+  const buildSystemPrompt = options.buildSystemPrompt;
+  const buildUserMessage = options.buildUserMessage;
+  let fallback = null;
+  // Holds the most recent failure in the chain (overwritten by each failed attempt).
+  let primaryError = null;
+  let lastProviderId = null;
+  for (const currentModelId of providersToTry) {
+    const currentProviderId = modelToProviderId(currentModelId);
+    const providerConfig = runtime.providers[currentProviderId];
+    const providerTimeoutMs = computeProviderTimeoutMs(plan, providerConfig, options);
+    const breaker = options.getBreaker?.(currentModelId, runtime.runtime) || null;
+    lastProviderId = currentProviderId;
+    if (breaker?.isOpen()) {
+      const retryAfter = breaker.retryAfter();
+      console.warn(`[Nemoris] circuit breaker open for ${currentModelId}, skipping (retry in ${Math.ceil(retryAfter)}s)`);
+      primaryError = new Error(`Provider ${currentModelId} circuit open — retry after ${Math.ceil(retryAfter)}s`);
+      annotateAttemptError(primaryError, {
+        providerId: currentProviderId,
+        modelId: currentModelId,
+        routingDecision,
+        fallback
+      });
+      continue;
+    }
+    try {
+      const attempt = await executeProviderCall({
+        plan,
+        runtime,
+        mode,
+        registry,
+        tokenCounter,
+        modelId: currentModelId,
+        providerId: currentProviderId,
+        providerConfig,
+        routingDecision,
+        providerTimeoutMs,
+        toolSchemas,
+        buildSystemPrompt,
+        buildUserMessage,
+        // The fallback record is seeded from the first model that gets as far as being prepared.
+        onPrepared: () => {
+          if (!fallback) {
+            fallback = buildFallbackState(runtime.runtime, routingDecision, currentProviderId, currentModelId, options);
+          }
+        }
+      });
+      if (mode === "provider") {
+        breaker?.recordSuccess();
+      }
+      return {
+        ...attempt,
+        routingDecision,
+        fallback,
+        primaryModelId
+      };
+    } catch (err) {
+      primaryError = annotateAttemptError(err, {
+        providerId: currentProviderId,
+        modelId: currentModelId,
+        routingDecision,
+        fallback
+      });
+      // Guard every dereference: a provider may reject with null/undefined, and a
+      // TypeError raised here would mask the real failure and abort failover.
+      const statusCode = err?.statusCode || err?.status || 0;
+      breaker?.recordFailure(statusCode);
+      if (err != null && isRetryableError(err)) {
+        console.warn(`[executor] provider ${currentModelId} failed: ${err.message}, trying next`);
+        continue;
+      }
+      break;
+    }
+  }
+  if (!primaryError) {
+    primaryError = new Error("All providers in failover chain exhausted");
+    annotateAttemptError(primaryError, {
+      routingDecision,
+      fallback
+    });
+  }
+  const failureClass = classifyRuntimeFailure(primaryError?.message || "");
+  const fallbackResolution = resolveReportFallback({
+    runtimeConfig: runtime.runtime,
+    job: plan.job,
+    routingDecision,
+    providerId: lastProviderId,
+    failureClass,
+    options
+  });
+  fallback = {
+    ...(fallback || {}),
+    allowed: fallbackResolution.allowed,
+    attempted: false,
+    trigger: failureClass,
+    localFailureClass: failureClass,
+    localError: primaryError.message,
+    blockedReason: fallbackResolution.allowed ? null : fallbackResolution.reason,
+    targetLane: fallbackResolution.targetLane || null
+  };
+  if (!fallbackResolution.allowed) {
+    annotateAttemptError(primaryError, {
+      providerId: primaryError.providerId || lastProviderId,
+      routingDecision,
+      fallback
+    });
+    throw primaryError;
+  }
+  fallback.attempted = true;
+  const fallbackRoutingDecision = {
+    ...routingDecision,
+    selectedLane: fallbackResolution.targetLane,
+    routeMode: "fallback",
+    reasons: [...(routingDecision.reasons || []), `fallback:${failureClass}`],
+    description: "Failure-triggered report fallback."
+  };
+  const fallbackModelId = router.resolve(fallbackResolution.targetLane, "primary");
+  const fallbackProviderId = modelToProviderId(fallbackModelId);
+  const fallbackProviderConfig = runtime.providers[fallbackProviderId];
+  try {
+    const attempt = await executeProviderCall({
+      plan,
+      runtime,
+      mode,
+      registry,
+      tokenCounter,
+      modelId: fallbackModelId,
+      providerId: fallbackProviderId,
+      providerConfig: fallbackProviderConfig,
+      routingDecision: fallbackRoutingDecision,
+      providerTimeoutMs: computeProviderTimeoutMs(plan, fallbackProviderConfig, options),
+      toolSchemas,
+      buildSystemPrompt,
+      buildUserMessage
+    });
+    return {
+      ...attempt,
+      routingDecision: fallbackRoutingDecision,
+      fallback: {
+        ...fallback,
+        success: true,
+        finalSourceLane: fallbackRoutingDecision.selectedLane,
+        finalProviderId: fallbackProviderId,
+        finalModelId: fallbackModelId
+      },
+      // Tool loops on the fallback lane are opt-in and never enabled for dry runs.
+      toolLoopEnabled: mode === "provider" && Boolean(options.allowToolLoopOnFallback)
+    };
+  } catch (fallbackError) {
+    // Tolerate non-Error rejection values when building the report.
+    const fallbackMessage = fallbackError?.message ?? String(fallbackError);
+    fallback = {
+      ...fallback,
+      success: false,
+      fallbackFailureClass: classifyRuntimeFailure(fallbackError?.message || ""),
+      fallbackError: fallbackMessage
+    };
+    // Keep the underlying failure (and its stack) reachable through `cause`.
+    const combinedError = new Error(
+      `Primary provider failed (${failureClass}) and fallback failed: ${fallbackMessage}`,
+      { cause: fallbackError }
+    );
+    annotateAttemptError(combinedError, {
+      providerId: fallbackProviderId,
+      modelId: fallbackModelId,
+      routingDecision: fallbackRoutingDecision,
+      providerCapabilities: fallbackError?.providerCapabilities || null,
+      invocation: fallbackError?.invocation || null,
+      preflight: fallbackError?.preflight || null,
+      fallback
+    });
+    throw combinedError;
+  }
+}