npm - nemoris - Versions diffs - 0.1.0 - Mend

nemoris 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (223) hide show

package/.env.example +49 -0
package/LICENSE +21 -0
package/README.md +209 -0
package/SECURITY.md +119 -0
package/bin/nemoris +46 -0
package/config/agents/agent.toml.example +28 -0
package/config/agents/default.toml +22 -0
package/config/agents/orchestrator.toml +18 -0
package/config/delivery.toml +73 -0
package/config/embeddings.toml +5 -0
package/config/identity/default-purpose.md +1 -0
package/config/identity/default-soul.md +3 -0
package/config/identity/orchestrator-purpose.md +1 -0
package/config/identity/orchestrator-soul.md +1 -0
package/config/improvement-targets.toml +15 -0
package/config/jobs/heartbeat-check.toml +30 -0
package/config/jobs/memory-rollup.toml +46 -0
package/config/jobs/workspace-health.toml +63 -0
package/config/mcp.toml +16 -0
package/config/output-contracts.toml +17 -0
package/config/peers.toml +32 -0
package/config/peers.toml.example +32 -0
package/config/policies/memory-default.toml +10 -0
package/config/policies/memory-heartbeat.toml +5 -0
package/config/policies/memory-ops.toml +10 -0
package/config/policies/tools-heartbeat-minimal.toml +8 -0
package/config/policies/tools-interactive-safe.toml +8 -0
package/config/policies/tools-ops-bounded.toml +8 -0
package/config/policies/tools-orchestrator.toml +7 -0
package/config/providers/anthropic.toml +15 -0
package/config/providers/ollama.toml +5 -0
package/config/providers/openai-codex.toml +9 -0
package/config/providers/openrouter.toml +5 -0
package/config/router.toml +22 -0
package/config/runtime.toml +114 -0
package/config/skills/self-improvement.toml +15 -0
package/config/skills/telegram-onboarding-spec.md +240 -0
package/config/skills/workspace-monitor.toml +15 -0
package/config/task-router.toml +42 -0
package/install.sh +50 -0
package/package.json +90 -0
package/src/auth/auth-profiles.js +169 -0
package/src/auth/openai-codex-oauth.js +285 -0
package/src/battle.js +449 -0
package/src/cli/help.js +265 -0
package/src/cli/output-filter.js +49 -0
package/src/cli/runtime-control.js +704 -0
package/src/cli-main.js +2763 -0
package/src/cli.js +78 -0
package/src/config/loader.js +332 -0
package/src/config/schema-validator.js +214 -0
package/src/config/toml-lite.js +8 -0
package/src/daemon/action-handlers.js +71 -0
package/src/daemon/healing-tick.js +87 -0
package/src/daemon/health-probes.js +90 -0
package/src/daemon/notifier.js +57 -0
package/src/daemon/nurse.js +218 -0
package/src/daemon/repair-log.js +106 -0
package/src/daemon/rule-staging.js +90 -0
package/src/daemon/rules.js +29 -0
package/src/daemon/telegram-commands.js +54 -0
package/src/daemon/updater.js +85 -0
package/src/jobs/job-runner.js +78 -0
package/src/mcp/consumer.js +129 -0
package/src/memory/active-recall.js +171 -0
package/src/memory/backend-manager.js +97 -0
package/src/memory/backends/file-backend.js +38 -0
package/src/memory/backends/qmd-backend.js +219 -0
package/src/memory/embedding-guards.js +24 -0
package/src/memory/embedding-index.js +118 -0
package/src/memory/embedding-service.js +179 -0
package/src/memory/file-index.js +177 -0
package/src/memory/memory-signature.js +5 -0
package/src/memory/memory-store.js +648 -0
package/src/memory/retrieval-planner.js +66 -0
package/src/memory/scoring.js +145 -0
package/src/memory/simhash.js +78 -0
package/src/memory/sqlite-active-store.js +824 -0
package/src/memory/write-policy.js +36 -0
package/src/onboarding/aliases.js +33 -0
package/src/onboarding/auth/api-key.js +224 -0
package/src/onboarding/auth/ollama-detect.js +42 -0
package/src/onboarding/clack-prompter.js +77 -0
package/src/onboarding/doctor.js +530 -0
package/src/onboarding/lock.js +42 -0
package/src/onboarding/model-catalog.js +344 -0
package/src/onboarding/phases/auth.js +589 -0
package/src/onboarding/phases/build.js +130 -0
package/src/onboarding/phases/choose.js +82 -0
package/src/onboarding/phases/detect.js +98 -0
package/src/onboarding/phases/hatch.js +216 -0
package/src/onboarding/phases/identity.js +79 -0
package/src/onboarding/phases/ollama.js +345 -0
package/src/onboarding/phases/scaffold.js +99 -0
package/src/onboarding/phases/telegram.js +377 -0
package/src/onboarding/phases/validate.js +204 -0
package/src/onboarding/phases/verify.js +206 -0
package/src/onboarding/platform.js +482 -0
package/src/onboarding/status-bar.js +95 -0
package/src/onboarding/templates.js +794 -0
package/src/onboarding/toml-writer.js +38 -0
package/src/onboarding/tui.js +250 -0
package/src/onboarding/uninstall.js +153 -0
package/src/onboarding/wizard.js +499 -0
package/src/providers/anthropic.js +168 -0
package/src/providers/base.js +247 -0
package/src/providers/circuit-breaker.js +136 -0
package/src/providers/ollama.js +163 -0
package/src/providers/openai-codex.js +149 -0
package/src/providers/openrouter.js +136 -0
package/src/providers/registry.js +36 -0
package/src/providers/router.js +16 -0
package/src/runtime/bootstrap-cache.js +47 -0
package/src/runtime/capabilities-prompt.js +25 -0
package/src/runtime/completion-ping.js +99 -0
package/src/runtime/config-validator.js +121 -0
package/src/runtime/context-ledger.js +360 -0
package/src/runtime/cutover-readiness.js +42 -0
package/src/runtime/daemon.js +729 -0
package/src/runtime/delivery-ack.js +195 -0
package/src/runtime/delivery-adapters/local-file.js +41 -0
package/src/runtime/delivery-adapters/openclaw-cli.js +94 -0
package/src/runtime/delivery-adapters/openclaw-peer.js +98 -0
package/src/runtime/delivery-adapters/shadow.js +13 -0
package/src/runtime/delivery-adapters/standalone-http.js +98 -0
package/src/runtime/delivery-adapters/telegram.js +104 -0
package/src/runtime/delivery-adapters/tui.js +128 -0
package/src/runtime/delivery-manager.js +807 -0
package/src/runtime/delivery-store.js +168 -0
package/src/runtime/dependency-health.js +118 -0
package/src/runtime/envelope.js +114 -0
package/src/runtime/evaluation.js +1089 -0
package/src/runtime/exec-approvals.js +216 -0
package/src/runtime/executor.js +500 -0
package/src/runtime/failure-ping.js +67 -0
package/src/runtime/flows.js +83 -0
package/src/runtime/guards.js +45 -0
package/src/runtime/handoff.js +51 -0
package/src/runtime/identity-cache.js +28 -0
package/src/runtime/improvement-engine.js +109 -0
package/src/runtime/improvement-harness.js +581 -0
package/src/runtime/input-sanitiser.js +72 -0
package/src/runtime/interaction-contract.js +347 -0
package/src/runtime/lane-readiness.js +226 -0
package/src/runtime/migration.js +323 -0
package/src/runtime/model-resolution.js +78 -0
package/src/runtime/network.js +64 -0
package/src/runtime/notification-store.js +97 -0
package/src/runtime/notifier.js +256 -0
package/src/runtime/orchestrator.js +53 -0
package/src/runtime/orphan-reaper.js +41 -0
package/src/runtime/output-contract-schema.js +139 -0
package/src/runtime/output-contract-validator.js +439 -0
package/src/runtime/peer-readiness.js +69 -0
package/src/runtime/peer-registry.js +133 -0
package/src/runtime/pilot-status.js +108 -0
package/src/runtime/prompt-builder.js +261 -0
package/src/runtime/provider-attempt.js +582 -0
package/src/runtime/report-fallback.js +71 -0
package/src/runtime/result-normalizer.js +183 -0
package/src/runtime/retention.js +74 -0
package/src/runtime/review.js +244 -0
package/src/runtime/route-job.js +15 -0
package/src/runtime/run-store.js +38 -0
package/src/runtime/schedule.js +88 -0
package/src/runtime/scheduler-state.js +434 -0
package/src/runtime/scheduler.js +656 -0
package/src/runtime/session-compactor.js +182 -0
package/src/runtime/session-search.js +155 -0
package/src/runtime/slack-inbound.js +249 -0
package/src/runtime/ssrf.js +102 -0
package/src/runtime/status-aggregator.js +330 -0
package/src/runtime/task-contract.js +140 -0
package/src/runtime/task-packet.js +107 -0
package/src/runtime/task-router.js +140 -0
package/src/runtime/telegram-inbound.js +1565 -0
package/src/runtime/token-counter.js +134 -0
package/src/runtime/token-estimator.js +59 -0
package/src/runtime/tool-loop.js +200 -0
package/src/runtime/transport-server.js +311 -0
package/src/runtime/tui-server.js +411 -0
package/src/runtime/ulid.js +44 -0
package/src/security/ssrf-check.js +197 -0
package/src/setup.js +369 -0
package/src/shadow/bridge.js +303 -0
package/src/skills/loader.js +84 -0
package/src/tools/catalog.json +49 -0
package/src/tools/cli-delegate.js +44 -0
package/src/tools/mcp-client.js +106 -0
package/src/tools/micro/cancel-task.js +6 -0
package/src/tools/micro/complete-task.js +6 -0
package/src/tools/micro/fail-task.js +6 -0
package/src/tools/micro/http-fetch.js +74 -0
package/src/tools/micro/index.js +36 -0
package/src/tools/micro/lcm-recall.js +60 -0
package/src/tools/micro/list-dir.js +17 -0
package/src/tools/micro/list-skills.js +46 -0
package/src/tools/micro/load-skill.js +38 -0
package/src/tools/micro/memory-search.js +45 -0
package/src/tools/micro/read-file.js +11 -0
package/src/tools/micro/session-search.js +54 -0
package/src/tools/micro/shell-exec.js +43 -0
package/src/tools/micro/trigger-job.js +79 -0
package/src/tools/micro/web-search.js +58 -0
package/src/tools/micro/workspace-paths.js +39 -0
package/src/tools/micro/write-file.js +14 -0
package/src/tools/micro/write-memory.js +41 -0
package/src/tools/registry.js +348 -0
package/src/tools/tool-result-contract.js +36 -0
package/src/tui/chat.js +835 -0
package/src/tui/renderer.js +175 -0
package/src/tui/socket-client.js +217 -0
package/src/utils/canonical-json.js +29 -0
package/src/utils/compaction.js +30 -0
package/src/utils/env-loader.js +5 -0
package/src/utils/errors.js +80 -0
package/src/utils/fs.js +101 -0
package/src/utils/ids.js +5 -0
package/src/utils/model-context-limits.js +30 -0
package/src/utils/token-budget.js +74 -0
package/src/utils/usage-cost.js +25 -0
package/src/utils/usage-metrics.js +14 -0
package/vendor/smol-toml-1.5.2.tgz +0 -0

package/src/runtime/provider-attempt.js ADDED Viewed

@@ -0,0 +1,582 @@
+import { downloadTelegramFile } from "./telegram-inbound.js";
+import { ModelRouter } from "../providers/router.js";
+import { assertProviderExecutionAllowed } from "./guards.js";
+import { compileOutputContractSchema } from "./output-contract-schema.js";
+import { estimateInvocationTokens } from "./token-estimator.js";
+import { TokenCounter } from "./token-counter.js";
+import { classifyRuntimeFailure, getReportFallbackPolicy, resolveReportFallback } from "./report-fallback.js";
+import { extractUsageMetrics } from "../utils/usage-metrics.js";
+export function modelToProviderId(modelId) {
+  return String(modelId || "").split("/")[0] || null;
+}
+export function isRetryableError(err) {
+  const message = (err.message || "").toLowerCase();
+  const statusCode = err.statusCode || err.status || 0;
+  if (
+    message.includes("econnrefused") ||
+    message.includes("etimedout") ||
+    message.includes("fetch failed") ||
+    message.includes("net_error") ||
+    message.includes("timeout") ||
+    message.includes("enotfound") ||
+    message.includes("eai_again")
+  ) {
+    return true;
+  }
+  if (statusCode === 429 || (statusCode >= 500 && statusCode < 600)) {
+    return true;
+  }
+  return false;
+}
+export function computeProviderTimeoutMs(plan, providerConfig, options = {}) {
+  if (options.providerTimeoutMs != null) {
+    return Number(options.providerTimeoutMs);
+  }
+  const defaultTimeoutMs = Number(providerConfig?.defaultTimeoutMs || 0);
+  const budgetSeconds = Number(plan?.job?.budget?.maxRuntimeSeconds || 0);
+  const budgetTimeoutMs = budgetSeconds ? Math.min((budgetSeconds + 5) * 1000, 60000) : 0;
+  return Math.max(defaultTimeoutMs, budgetTimeoutMs || 0);
+}
+export function buildRoutingDecision(plan, options = {}) {
+  const routeMode = options.routeMode || plan.routing?.routeMode || "primary";
+  const selectedLane = options.laneOverride || plan.routing?.selectedLane || plan.job.modelLane;
+  return {
+    requestedLane: plan.job.modelLane,
+    selectedLane,
+    routeMode,
+    matchedRule: plan.routing?.matchedRule || null,
+    reasons: plan.routing?.reasons || [],
+    modelOverride: options.modelOverride || null
+  };
+}
+export function getLocalPromptContractOutputCap(plan, { providerId, providerCapabilities, routingDecision }) {
+  if (providerId !== "ollama") return null;
+  if (providerCapabilities?.structuredOutputMode !== "prompt_contract") return null;
+  const format = plan?.packet?.layers?.outputContract?.format || null;
+  if (format === "bulleted_briefing") return 1500;
+  if (format === "structured_rollup") return 2000;
+  if (routingDecision?.selectedLane === "local_cheap") return 400;
+  if (routingDecision?.selectedLane === "local_report") return 1200;
+  return null;
+}
+export async function prepareProviderAttempt({
+  plan,
+  runtimeConfig,
+  registry,
+  tokenCounter,
+  modelId,
+  providerConfig,
+  providerId,
+  routingDecision,
+  providerTimeoutMs,
+  toolSchemas,
+  buildSystemPrompt,
+  buildUserMessage
+}) {
+  if (!providerConfig) {
+    throw new Error(`No provider config for model ${modelId}`);
+  }
+  const adapter = registry.create(providerConfig);
+  const providerCapabilities = adapter?.getCapabilities?.() || null;
+  const nativeStructuredOutput = Boolean(
+    adapter &&
+      plan.packet.layers.outputContract &&
+      typeof adapter.supportsNativeStructuredOutput === "function" &&
+      adapter.supportsNativeStructuredOutput()
+  );
+  const responseSchema = nativeStructuredOutput
+    ? compileOutputContractSchema(plan.packet.layers.outputContract, {
+        thoughtFirst: providerCapabilities?.supportsReasoningSchema === true
+      })
+    : null;
+  const localPromptContractCap = getLocalPromptContractOutputCap(plan, {
+    providerId,
+    providerCapabilities,
+    routingDecision
+  });
+  const effectiveMaxTokens = localPromptContractCap
+    ? Math.min(Number(plan.job.budget.maxTokens || 0) || 0, localPromptContractCap)
+    : plan.job.budget.maxTokens;
+  const invocation = {
+    model: modelId,
+    system: buildSystemPrompt(plan, {
+      nativeStructuredOutput,
+      responseSchema,
+      toolSchemas
+    }),
+    messages: [
+      {
+        role: "user",
+        content: buildUserMessage(plan, {
+          nativeStructuredOutput,
+          responseSchema
+        })
+      }
+    ],
+    maxTokens: effectiveMaxTokens,
+    responseSchema,
+    timeoutMs: providerTimeoutMs,
+    tools: toolSchemas?.length ? toolSchemas : undefined,
+    options:
+      providerId === "ollama"
+        ? {
+            num_predict: effectiveMaxTokens
+          }
+        : undefined
+  };
+  const thinkMode = plan?.packet?.thinkMode;
+  if (
+    thinkMode && thinkMode !== "off" &&
+    providerId === "anthropic" &&
+    process.env.ANTHROPIC_THINKING_ENABLED === "true"
+  ) {
+    const THINK_BUDGETS = { low: 1000, medium: 8000, high: 16000 };
+    const budget = THINK_BUDGETS[thinkMode] || 8000;
+    invocation.betas = [...(invocation.betas || []), "interleaved-thinking-2025-05-14"];
+    invocation.thinking = { type: "enabled", budget_tokens: budget };
+  }
+  const preflight = await buildPreflight(runtimeConfig, invocation, {
+    providerId,
+    adapter,
+    tokenCounter
+  });
+  if (preflight.pressure === "hard") {
+    throw new Error(
+      `Preflight blocked ${plan.job.id}: estimated prompt tokens ${preflight.estimatedPromptTokens} exceed hard limit ${preflight.hardLimit}`
+    );
+  }
+  return {
+    adapter,
+    providerCapabilities,
+    invocation,
+    preflight
+  };
+}
+export async function buildPreflight(runtimeConfig, invocation, options = {}) {
+  const contextTokens = runtimeConfig?.safety?.contextTokens ?? 32768;
+  const softRatio = runtimeConfig?.safety?.contextPressureSoftRatio ?? 0.72;
+  const hardRatio = runtimeConfig?.safety?.contextPressureHardRatio ?? 0.9;
+  const freshSessionOnHighPressure = runtimeConfig?.safety?.freshSessionOnHighPressure ?? true;
+  const snapshotBeforeCompaction = runtimeConfig?.safety?.snapshotBeforeCompaction ?? true;
+  const tokenCounter = options.tokenCounter || new TokenCounter();
+  const tokenEstimate = await tokenCounter.countInvocation({
+    providerId: options.providerId,
+    invocation,
+    adapter: options.adapter
+  });
+  const heuristicEstimate = tokenEstimate.mode === "heuristic" ? tokenEstimate.details : estimateInvocationTokens(invocation);
+  const estimatedPromptTokens = tokenEstimate.total;
+  const softLimit = Math.floor(contextTokens * softRatio);
+  const hardLimit = Math.floor(contextTokens * hardRatio);
+  let pressure = "low";
+  if (estimatedPromptTokens >= hardLimit) pressure = "hard";
+  else if (estimatedPromptTokens >= softLimit) pressure = "high";
+  return {
+    contextTokens,
+    estimatedPromptTokens,
+    tokenEstimate,
+    heuristicEstimate,
+    softLimit,
+    hardLimit,
+    pressure,
+    freshSessionRequired: pressure !== "low" && freshSessionOnHighPressure,
+    snapshotBeforeCompaction
+  };
+}
+async function attachVisionInputs(plan, runtimeConfig, invocation, providerCapabilities) {
+  if (!plan.packet?.imageRefs?.length || !invocation) {
+    return invocation;
+  }
+  if (providerCapabilities?.supportsVision) {
+    const tgConfig = runtimeConfig?.telegram;
+    const botToken = tgConfig?.botTokenEnv ? process.env[tgConfig.botTokenEnv] : null;
+    if (!botToken) {
+      console.warn(`[executor] imageRefs present but botToken not resolved from ${tgConfig?.botTokenEnv || "undefined env key"}`);
+      return invocation;
+    }
+    const imageBlocks = [];
+    for (const ref of plan.packet.imageRefs) {
+      const downloaded = await downloadTelegramFile(ref.fileId, botToken);
+      if (downloaded) {
+        imageBlocks.push({
+          type: "image",
+          source: {
+            type: "base64",
+            media_type: downloaded.mediaType,
+            data: downloaded.base64,
+          },
+        });
+      }
+    }
+    if (imageBlocks.length > 0) {
+      const userIdx = invocation.messages.findLastIndex((message) => message.role === "user");
+      if (userIdx !== -1) {
+        const textContent = invocation.messages[userIdx].content;
+        invocation.messages[userIdx].content = [
+          ...imageBlocks,
+          { type: "text", text: textContent },
+        ];
+      }
+    }
+    return invocation;
+  }
+  const visionNote = "[Image received but this model doesn't support vision]";
+  const userIdx = invocation.messages.findLastIndex((message) => message.role === "user");
+  if (userIdx !== -1) {
+    const existing = invocation.messages[userIdx].content;
+    invocation.messages[userIdx].content = existing
+      ? `${existing}\n\n${visionNote}`
+      : visionNote;
+  }
+  return invocation;
+}
+function annotateAttemptError(error, metadata = {}) {
+  if (!error || typeof error !== "object") {
+    return error;
+  }
+  Object.assign(error, metadata);
+  return error;
+}
+async function executeProviderCall({
+  plan,
+  runtime,
+  mode,
+  registry,
+  tokenCounter,
+  modelId,
+  providerId,
+  providerConfig,
+  routingDecision,
+  providerTimeoutMs,
+  toolSchemas,
+  buildSystemPrompt,
+  buildUserMessage,
+  onPrepared
+}) {
+  let prepared = null;
+  let invocation = null;
+  try {
+    prepared = await prepareProviderAttempt({
+      plan,
+      runtimeConfig: runtime.runtime,
+      registry,
+      tokenCounter,
+      modelId,
+      providerConfig,
+      providerId,
+      routingDecision,
+      providerTimeoutMs,
+      toolSchemas,
+      buildSystemPrompt,
+      buildUserMessage
+    });
+    if (typeof onPrepared === "function") {
+      onPrepared(prepared);
+    }
+    invocation = await attachVisionInputs(
+      plan,
+      runtime.runtime,
+      prepared.invocation,
+      prepared.providerCapabilities
+    );
+    if (mode === "dry-run") {
+      return {
+        response: null,
+        providerId,
+        modelId,
+        usage: {
+          tokensIn: 0,
+          tokensOut: 0,
+          cacheIn: 0,
+          cacheCreation: 0,
+        },
+        cached: false,
+        adapter: prepared.adapter,
+        providerCapabilities: prepared.providerCapabilities,
+        invocation,
+        preflight: prepared.preflight,
+        providerModePolicy: null,
+        health: null,
+        toolLoopEnabled: false
+      };
+    }
+    const providerModePolicy = assertProviderExecutionAllowed({
+      jobId: plan.job.id,
+      modelLane: routingDecision.selectedLane,
+      providerId,
+      interactive: plan.job.trigger === "interactive"
+    });
+    let health = null;
+    if (providerModePolicy.requireHealthyProvider) {
+      const healthCheck = await prepared.adapter.healthCheck();
+      if (!healthCheck.ok) {
+        throw new Error(`Provider health check failed for ${providerId} with status ${healthCheck.status}`);
+      }
+      health = healthCheck;
+    }
+    const response = await prepared.adapter.invoke(invocation);
+    const usage = extractUsageMetrics(response);
+    return {
+      response,
+      providerId,
+      modelId,
+      usage,
+      cached: Boolean(usage.cacheIn || usage.cacheCreation),
+      adapter: prepared.adapter,
+      providerCapabilities: prepared.providerCapabilities,
+      invocation,
+      preflight: prepared.preflight,
+      providerModePolicy,
+      health,
+      toolLoopEnabled: true
+    };
+  } catch (error) {
+    throw annotateAttemptError(error, {
+      providerId,
+      modelId,
+      routingDecision,
+      providerCapabilities: prepared?.providerCapabilities || null,
+      invocation: invocation || prepared?.invocation || null,
+      preflight: prepared?.preflight || null
+    });
+  }
+}
+function buildFallbackState(runtimeConfig, routingDecision, providerId, modelId, options) {
+  return {
+    allowed: false,
+    attempted: false,
+    trigger: null,
+    finalSourceLane: routingDecision.selectedLane,
+    sourceLane: routingDecision.selectedLane,
+    sourceProviderId: providerId,
+    sourceModelId: modelId,
+    policy: getReportFallbackPolicy(runtimeConfig, options)
+  };
+}
+export async function attemptProvider({ plan, runtime, options = {} }) {
+  const mode = options.mode || "dry-run";
+  const router = options.router || new ModelRouter(runtime.router);
+  const routingDecision = buildRoutingDecision(plan, options);
+  const laneConfig = runtime.router?.[routingDecision.selectedLane];
+  const primaryModelId = options.modelOverride || plan.packet.modelOverride || router.resolve(routingDecision.selectedLane, routingDecision.routeMode);
+  const providersToTry = [primaryModelId, ...(laneConfig?.fallbackModels || [])];
+  const toolSchemas = options.toolSchemas || [];
+  const registry = options.registry;
+  const tokenCounter = options.tokenCounter;
+  const buildSystemPrompt = options.buildSystemPrompt;
+  const buildUserMessage = options.buildUserMessage;
+  let fallback = null;
+  let primaryError = null;
+  let lastProviderId = null;
+  for (const currentModelId of providersToTry) {
+    const currentProviderId = modelToProviderId(currentModelId);
+    const providerConfig = runtime.providers[currentProviderId];
+    const providerTimeoutMs = computeProviderTimeoutMs(plan, providerConfig, options);
+    const breaker = options.getBreaker?.(currentModelId, runtime.runtime) || null;
+    lastProviderId = currentProviderId;
+    if (breaker?.isOpen()) {
+      const retryAfter = breaker.retryAfter();
+      console.warn(`[Nemoris] circuit breaker open for ${currentModelId}, skipping (retry in ${Math.ceil(retryAfter)}s)`);
+      primaryError = new Error(`Provider ${currentModelId} circuit open — retry after ${Math.ceil(retryAfter)}s`);
+      annotateAttemptError(primaryError, {
+        providerId: currentProviderId,
+        modelId: currentModelId,
+        routingDecision,
+        fallback
+      });
+      continue;
+    }
+    try {
+      const attempt = await executeProviderCall({
+        plan,
+        runtime,
+        mode,
+        registry,
+        tokenCounter,
+        modelId: currentModelId,
+        providerId: currentProviderId,
+        providerConfig,
+        routingDecision,
+        providerTimeoutMs,
+        toolSchemas,
+        buildSystemPrompt,
+        buildUserMessage,
+        onPrepared: () => {
+          if (!fallback) {
+            fallback = buildFallbackState(runtime.runtime, routingDecision, currentProviderId, currentModelId, options);
+          }
+        }
+      });
+      if (mode === "provider") {
+        breaker?.recordSuccess();
+      }
+      return {
+        ...attempt,
+        routingDecision,
+        fallback,
+        primaryModelId
+      };
+    } catch (err) {
+      primaryError = annotateAttemptError(err, {
+        providerId: currentProviderId,
+        modelId: currentModelId,
+        routingDecision,
+        fallback
+      });
+      const statusCode = err.statusCode || err.status || 0;
+      breaker?.recordFailure(statusCode);
+      if (isRetryableError(err)) {
+        console.warn(`[executor] provider ${currentModelId} failed: ${err.message}, trying next`);
+        continue;
+      }
+      break;
+    }
+  }
+  if (!primaryError) {
+    primaryError = new Error("All providers in failover chain exhausted");
+    annotateAttemptError(primaryError, {
+      routingDecision,
+      fallback
+    });
+  }
+  const failureClass = classifyRuntimeFailure(primaryError?.message || "");
+  const fallbackResolution = resolveReportFallback({
+    runtimeConfig: runtime.runtime,
+    job: plan.job,
+    routingDecision,
+    providerId: lastProviderId,
+    failureClass,
+    options
+  });
+  fallback = {
+    ...(fallback || {}),
+    allowed: fallbackResolution.allowed,
+    attempted: false,
+    trigger: failureClass,
+    localFailureClass: failureClass,
+    localError: primaryError.message,
+    blockedReason: fallbackResolution.allowed ? null : fallbackResolution.reason,
+    targetLane: fallbackResolution.targetLane || null
+  };
+  if (!fallbackResolution.allowed) {
+    annotateAttemptError(primaryError, {
+      providerId: primaryError.providerId || lastProviderId,
+      routingDecision,
+      fallback
+    });
+    throw primaryError;
+  }
+  fallback.attempted = true;
+  const fallbackRoutingDecision = {
+    ...routingDecision,
+    selectedLane: fallbackResolution.targetLane,
+    routeMode: "fallback",
+    reasons: [...(routingDecision.reasons || []), `fallback:${failureClass}`],
+    description: "Failure-triggered report fallback."
+  };
+  const fallbackModelId = router.resolve(fallbackResolution.targetLane, "primary");
+  const fallbackProviderId = modelToProviderId(fallbackModelId);
+  const fallbackProviderConfig = runtime.providers[fallbackProviderId];
+  try {
+    const attempt = await executeProviderCall({
+      plan,
+      runtime,
+      mode,
+      registry,
+      tokenCounter,
+      modelId: fallbackModelId,
+      providerId: fallbackProviderId,
+      providerConfig: fallbackProviderConfig,
+      routingDecision: fallbackRoutingDecision,
+      providerTimeoutMs: computeProviderTimeoutMs(plan, fallbackProviderConfig, options),
+      toolSchemas,
+      buildSystemPrompt,
+      buildUserMessage
+    });
+    return {
+      ...attempt,
+      routingDecision: fallbackRoutingDecision,
+      fallback: {
+        ...fallback,
+        success: true,
+        finalSourceLane: fallbackRoutingDecision.selectedLane,
+        finalProviderId: fallbackProviderId,
+        finalModelId: fallbackModelId
+      },
+      toolLoopEnabled: mode === "provider" && Boolean(options.allowToolLoopOnFallback)
+    };
+  } catch (fallbackError) {
+    fallback = {
+      ...fallback,
+      success: false,
+      fallbackFailureClass: classifyRuntimeFailure(fallbackError?.message || ""),
+      fallbackError: fallbackError.message
+    };
+    const combinedError = new Error(
+      `Primary provider failed (${failureClass}) and fallback failed: ${fallbackError.message}`
+    );
+    annotateAttemptError(combinedError, {
+      providerId: fallbackProviderId,
+      modelId: fallbackModelId,
+      routingDecision: fallbackRoutingDecision,
+      providerCapabilities: fallbackError?.providerCapabilities || null,
+      invocation: fallbackError?.invocation || null,
+      preflight: fallbackError?.preflight || null,
+      fallback
+    });
+    throw combinedError;
+  }
+}

package/src/runtime/report-fallback.js ADDED Viewed

@@ -0,0 +1,71 @@
+import { getProviderModePolicy } from "./guards.js";
+function readFlag(name) {
+  const raw = process.env[name];
+  return raw === "1" || raw === "true";
+}
+export function classifyRuntimeFailure(message) {
+  const normalized = String(message || "").toLowerCase();
+  if (!normalized) return "unknown_failure";
+  if (normalized.includes("timed out")) return "timeout";
+  if (normalized.includes("loading model") || normalized.includes("server loading")) return "provider_loading";
+  if (normalized.includes("missing auth token") || normalized.includes("missing api key")) return "auth_missing";
+  if (normalized.includes("model") && normalized.includes("not found")) return "missing_model";
+  if (normalized.includes("structured") && normalized.includes("output")) return "structured_output_failure";
+  if (normalized.includes("provider error")) return "provider_error";
+  return "unknown_failure";
+}
+export function getReportFallbackPolicy(runtimeConfig = {}, options = {}) {
+  const configured = runtimeConfig?.reportFallback || {};
+  const envEnabled = readFlag("NEMORIS_ALLOW_REPORT_FALLBACK");
+  const allowReportFallback = Boolean(options.allowReportFallback || envEnabled || configured.enabled === true);
+  return {
+    enabled: allowReportFallback,
+    configEnabled: configured.enabled === true,
+    envEnabled,
+    overrideEnabled: Boolean(options.allowReportFallback),
+    lane: configured.lane || "report_fallback_lowcost",
+    allowedJobIds: configured.allowedJobIds || ["workspace-health"],
+    allowedFailureClasses: configured.allowedFailureClasses || ["timeout", "provider_loading"]
+  };
+}
+export function resolveReportFallback({ runtimeConfig, job, routingDecision, providerId, failureClass, options = {} }) {
+  const policy = getReportFallbackPolicy(runtimeConfig, options);
+  const jobPolicy = job?.reportFallback || null;
+  if (!jobPolicy?.enabled) {
+    return { allowed: false, policy, reason: "Job is not configured for report fallback." };
+  }
+  if (!policy.enabled) {
+    return { allowed: false, policy, reason: "Report fallback is disabled." };
+  }
+  if (!policy.allowedJobIds.includes(job.id)) {
+    return { allowed: false, policy, reason: `Job ${job.id} is not allowed to use report fallback.` };
+  }
+  if (!policy.allowedFailureClasses.includes(failureClass)) {
+    return { allowed: false, policy, reason: `Failure class ${failureClass} does not qualify for report fallback.` };
+  }
+  if (providerId !== "ollama" || routingDecision?.selectedLane !== "local_report") {
+    return { allowed: false, policy, reason: "Report fallback only applies after local_report Ollama failures." };
+  }
+  const providerModePolicy = getProviderModePolicy();
+  if (!providerModePolicy.allowRemoteProviders) {
+    return { allowed: false, policy, reason: "Remote provider execution is not enabled." };
+  }
+  return {
+    allowed: true,
+    policy,
+    targetLane: jobPolicy.lane || policy.lane,
+    trigger: failureClass
+  };
+}