nemoris 0.1.0 → 0.1.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (248) hide show
  1. package/.env.example +49 -49
  2. package/LICENSE +21 -21
  3. package/README.md +209 -209
  4. package/SECURITY.md +59 -119
  5. package/bin/nemoris +46 -46
  6. package/config/agents/agent.toml.example +28 -28
  7. package/config/agents/content.toml +23 -0
  8. package/config/agents/default.toml +22 -22
  9. package/config/agents/heartbeat.toml +35 -0
  10. package/config/agents/iris.toml +23 -0
  11. package/config/agents/lab.toml +23 -0
  12. package/config/agents/main.toml +45 -0
  13. package/config/agents/nemo.toml +21 -0
  14. package/config/agents/ops.toml +38 -0
  15. package/config/agents/orchestrator.toml +18 -18
  16. package/config/agents/revenue.toml +23 -0
  17. package/config/agents/testyboo.toml +19 -0
  18. package/config/delivery.toml +73 -73
  19. package/config/embeddings.toml +5 -5
  20. package/config/identity/content-purpose.md +11 -0
  21. package/config/identity/content-soul.md +45 -0
  22. package/config/identity/default-purpose.md +1 -1
  23. package/config/identity/default-soul.md +3 -3
  24. package/config/identity/heartbeat-purpose.md +9 -0
  25. package/config/identity/heartbeat-soul.md +16 -0
  26. package/config/identity/iris-purpose.md +17 -0
  27. package/config/identity/iris-soul.md +68 -0
  28. package/config/identity/lab-purpose.md +10 -0
  29. package/config/identity/lab-soul.md +38 -0
  30. package/config/identity/main-purpose.md +17 -0
  31. package/config/identity/main-soul.md +66 -0
  32. package/config/identity/main-user.md +22 -0
  33. package/config/identity/ops-purpose.md +9 -0
  34. package/config/identity/ops-soul.md +16 -0
  35. package/config/identity/orchestrator-purpose.md +1 -1
  36. package/config/identity/orchestrator-soul.md +1 -1
  37. package/config/identity/revenue-purpose.md +9 -0
  38. package/config/identity/revenue-soul.md +41 -0
  39. package/config/identity/testyboo-purpose.md +13 -0
  40. package/config/identity/testyboo-soul.md +20 -0
  41. package/config/improvement-targets.toml +15 -15
  42. package/config/jobs/heartbeat-check.toml +30 -30
  43. package/config/jobs/memory-rollup.toml +46 -46
  44. package/config/jobs/workspace-health.toml +63 -63
  45. package/config/mcp.toml +16 -16
  46. package/config/output-contracts.toml +17 -17
  47. package/config/peers.toml +32 -32
  48. package/config/peers.toml.example +32 -32
  49. package/config/policies/memory-default.toml +10 -10
  50. package/config/policies/memory-heartbeat.toml +5 -5
  51. package/config/policies/memory-ops.toml +10 -10
  52. package/config/policies/tools-heartbeat-minimal.toml +8 -8
  53. package/config/policies/tools-interactive-safe.toml +8 -8
  54. package/config/policies/tools-ops-bounded.toml +8 -8
  55. package/config/policies/tools-orchestrator.toml +7 -7
  56. package/config/providers/anthropic.toml +15 -15
  57. package/config/providers/ollama.toml +5 -5
  58. package/config/providers/openai-codex.toml +9 -9
  59. package/config/providers/openrouter.toml +5 -5
  60. package/config/router.toml +22 -22
  61. package/config/runtime.toml +114 -114
  62. package/config/skills/self-improvement.toml +15 -15
  63. package/config/skills/telegram-onboarding-spec.md +240 -240
  64. package/config/skills/workspace-monitor.toml +15 -15
  65. package/config/task-router.toml +42 -42
  66. package/install.sh +50 -50
  67. package/package.json +91 -90
  68. package/src/auth/auth-profiles.js +169 -169
  69. package/src/auth/openai-codex-oauth.js +285 -285
  70. package/src/battle.js +449 -449
  71. package/src/cli/help.js +265 -265
  72. package/src/cli/output-filter.js +49 -49
  73. package/src/cli/runtime-control.js +704 -704
  74. package/src/cli-main.js +2763 -2763
  75. package/src/cli.js +78 -78
  76. package/src/config/loader.js +332 -332
  77. package/src/config/schema-validator.js +214 -214
  78. package/src/config/toml-lite.js +8 -8
  79. package/src/daemon/action-handlers.js +71 -71
  80. package/src/daemon/healing-tick.js +87 -87
  81. package/src/daemon/health-probes.js +90 -90
  82. package/src/daemon/notifier.js +57 -57
  83. package/src/daemon/nurse.js +218 -218
  84. package/src/daemon/repair-log.js +106 -106
  85. package/src/daemon/rule-staging.js +90 -90
  86. package/src/daemon/rules.js +29 -29
  87. package/src/daemon/telegram-commands.js +54 -54
  88. package/src/daemon/updater.js +85 -85
  89. package/src/jobs/job-runner.js +78 -78
  90. package/src/mcp/consumer.js +129 -129
  91. package/src/memory/active-recall.js +171 -171
  92. package/src/memory/backend-manager.js +97 -97
  93. package/src/memory/backends/file-backend.js +38 -38
  94. package/src/memory/backends/qmd-backend.js +219 -219
  95. package/src/memory/embedding-guards.js +24 -24
  96. package/src/memory/embedding-index.js +118 -118
  97. package/src/memory/embedding-service.js +179 -179
  98. package/src/memory/file-index.js +177 -177
  99. package/src/memory/memory-signature.js +5 -5
  100. package/src/memory/memory-store.js +648 -648
  101. package/src/memory/retrieval-planner.js +66 -66
  102. package/src/memory/scoring.js +145 -145
  103. package/src/memory/simhash.js +78 -78
  104. package/src/memory/sqlite-active-store.js +824 -824
  105. package/src/memory/write-policy.js +36 -36
  106. package/src/onboarding/aliases.js +33 -33
  107. package/src/onboarding/auth/api-key.js +224 -224
  108. package/src/onboarding/auth/ollama-detect.js +42 -42
  109. package/src/onboarding/clack-prompter.js +77 -77
  110. package/src/onboarding/doctor.js +530 -530
  111. package/src/onboarding/lock.js +42 -42
  112. package/src/onboarding/model-catalog.js +344 -344
  113. package/src/onboarding/phases/auth.js +576 -589
  114. package/src/onboarding/phases/build.js +130 -130
  115. package/src/onboarding/phases/choose.js +82 -82
  116. package/src/onboarding/phases/detect.js +98 -98
  117. package/src/onboarding/phases/hatch.js +216 -216
  118. package/src/onboarding/phases/identity.js +79 -79
  119. package/src/onboarding/phases/ollama.js +345 -345
  120. package/src/onboarding/phases/scaffold.js +99 -99
  121. package/src/onboarding/phases/telegram.js +377 -377
  122. package/src/onboarding/phases/validate.js +204 -204
  123. package/src/onboarding/phases/verify.js +206 -206
  124. package/src/onboarding/platform.js +482 -482
  125. package/src/onboarding/status-bar.js +95 -95
  126. package/src/onboarding/templates.js +794 -794
  127. package/src/onboarding/toml-writer.js +38 -38
  128. package/src/onboarding/tui.js +250 -250
  129. package/src/onboarding/uninstall.js +153 -153
  130. package/src/onboarding/wizard.js +516 -499
  131. package/src/providers/anthropic.js +168 -168
  132. package/src/providers/base.js +247 -247
  133. package/src/providers/circuit-breaker.js +136 -136
  134. package/src/providers/ollama.js +163 -163
  135. package/src/providers/openai-codex.js +149 -149
  136. package/src/providers/openrouter.js +136 -136
  137. package/src/providers/registry.js +36 -36
  138. package/src/providers/router.js +16 -16
  139. package/src/runtime/bootstrap-cache.js +47 -47
  140. package/src/runtime/capabilities-prompt.js +25 -25
  141. package/src/runtime/completion-ping.js +99 -99
  142. package/src/runtime/config-validator.js +121 -121
  143. package/src/runtime/context-ledger.js +360 -360
  144. package/src/runtime/cutover-readiness.js +42 -42
  145. package/src/runtime/daemon.js +729 -729
  146. package/src/runtime/delivery-ack.js +195 -195
  147. package/src/runtime/delivery-adapters/local-file.js +41 -41
  148. package/src/runtime/delivery-adapters/openclaw-cli.js +94 -94
  149. package/src/runtime/delivery-adapters/openclaw-peer.js +98 -98
  150. package/src/runtime/delivery-adapters/shadow.js +13 -13
  151. package/src/runtime/delivery-adapters/standalone-http.js +98 -98
  152. package/src/runtime/delivery-adapters/telegram.js +104 -104
  153. package/src/runtime/delivery-adapters/tui.js +128 -128
  154. package/src/runtime/delivery-manager.js +807 -807
  155. package/src/runtime/delivery-store.js +168 -168
  156. package/src/runtime/dependency-health.js +118 -118
  157. package/src/runtime/envelope.js +114 -114
  158. package/src/runtime/evaluation.js +1089 -1089
  159. package/src/runtime/exec-approvals.js +216 -216
  160. package/src/runtime/executor.js +500 -500
  161. package/src/runtime/failure-ping.js +67 -67
  162. package/src/runtime/flows.js +83 -83
  163. package/src/runtime/guards.js +45 -45
  164. package/src/runtime/handoff.js +51 -51
  165. package/src/runtime/identity-cache.js +28 -28
  166. package/src/runtime/improvement-engine.js +109 -109
  167. package/src/runtime/improvement-harness.js +581 -581
  168. package/src/runtime/input-sanitiser.js +72 -72
  169. package/src/runtime/interaction-contract.js +347 -347
  170. package/src/runtime/lane-readiness.js +226 -226
  171. package/src/runtime/migration.js +323 -323
  172. package/src/runtime/model-resolution.js +78 -78
  173. package/src/runtime/network.js +64 -64
  174. package/src/runtime/notification-store.js +97 -97
  175. package/src/runtime/notifier.js +256 -256
  176. package/src/runtime/orchestrator.js +53 -53
  177. package/src/runtime/orphan-reaper.js +41 -41
  178. package/src/runtime/output-contract-schema.js +139 -139
  179. package/src/runtime/output-contract-validator.js +439 -439
  180. package/src/runtime/peer-readiness.js +69 -69
  181. package/src/runtime/peer-registry.js +133 -133
  182. package/src/runtime/pilot-status.js +108 -108
  183. package/src/runtime/prompt-builder.js +261 -261
  184. package/src/runtime/provider-attempt.js +582 -582
  185. package/src/runtime/report-fallback.js +71 -71
  186. package/src/runtime/result-normalizer.js +183 -183
  187. package/src/runtime/retention.js +74 -74
  188. package/src/runtime/review.js +244 -244
  189. package/src/runtime/route-job.js +15 -15
  190. package/src/runtime/run-store.js +38 -38
  191. package/src/runtime/schedule.js +88 -88
  192. package/src/runtime/scheduler-state.js +434 -434
  193. package/src/runtime/scheduler.js +656 -656
  194. package/src/runtime/session-compactor.js +182 -182
  195. package/src/runtime/session-search.js +155 -155
  196. package/src/runtime/slack-inbound.js +249 -249
  197. package/src/runtime/ssrf.js +102 -102
  198. package/src/runtime/status-aggregator.js +330 -330
  199. package/src/runtime/task-contract.js +140 -140
  200. package/src/runtime/task-packet.js +107 -107
  201. package/src/runtime/task-router.js +140 -140
  202. package/src/runtime/telegram-inbound.js +1565 -1565
  203. package/src/runtime/token-counter.js +134 -134
  204. package/src/runtime/token-estimator.js +59 -59
  205. package/src/runtime/tool-loop.js +200 -200
  206. package/src/runtime/transport-server.js +311 -311
  207. package/src/runtime/tui-server.js +411 -411
  208. package/src/runtime/ulid.js +44 -44
  209. package/src/security/ssrf-check.js +197 -197
  210. package/src/setup.js +369 -369
  211. package/src/shadow/bridge.js +303 -303
  212. package/src/skills/loader.js +84 -84
  213. package/src/tools/catalog.json +49 -49
  214. package/src/tools/cli-delegate.js +44 -44
  215. package/src/tools/mcp-client.js +106 -106
  216. package/src/tools/micro/cancel-task.js +6 -6
  217. package/src/tools/micro/complete-task.js +6 -6
  218. package/src/tools/micro/fail-task.js +6 -6
  219. package/src/tools/micro/http-fetch.js +74 -74
  220. package/src/tools/micro/index.js +36 -36
  221. package/src/tools/micro/lcm-recall.js +60 -60
  222. package/src/tools/micro/list-dir.js +17 -17
  223. package/src/tools/micro/list-skills.js +46 -46
  224. package/src/tools/micro/load-skill.js +38 -38
  225. package/src/tools/micro/memory-search.js +45 -45
  226. package/src/tools/micro/read-file.js +11 -11
  227. package/src/tools/micro/session-search.js +54 -54
  228. package/src/tools/micro/shell-exec.js +43 -43
  229. package/src/tools/micro/trigger-job.js +79 -79
  230. package/src/tools/micro/web-search.js +58 -58
  231. package/src/tools/micro/workspace-paths.js +39 -39
  232. package/src/tools/micro/write-file.js +14 -14
  233. package/src/tools/micro/write-memory.js +41 -41
  234. package/src/tools/registry.js +348 -348
  235. package/src/tools/tool-result-contract.js +36 -36
  236. package/src/tui/chat.js +835 -835
  237. package/src/tui/renderer.js +175 -175
  238. package/src/tui/socket-client.js +217 -217
  239. package/src/utils/canonical-json.js +29 -29
  240. package/src/utils/compaction.js +30 -30
  241. package/src/utils/env-loader.js +5 -5
  242. package/src/utils/errors.js +80 -80
  243. package/src/utils/fs.js +101 -101
  244. package/src/utils/ids.js +5 -5
  245. package/src/utils/model-context-limits.js +30 -30
  246. package/src/utils/token-budget.js +74 -74
  247. package/src/utils/usage-cost.js +25 -25
  248. package/src/utils/usage-metrics.js +14 -14
@@ -1,582 +1,582 @@
1
- import { downloadTelegramFile } from "./telegram-inbound.js";
2
- import { ModelRouter } from "../providers/router.js";
3
- import { assertProviderExecutionAllowed } from "./guards.js";
4
- import { compileOutputContractSchema } from "./output-contract-schema.js";
5
- import { estimateInvocationTokens } from "./token-estimator.js";
6
- import { TokenCounter } from "./token-counter.js";
7
- import { classifyRuntimeFailure, getReportFallbackPolicy, resolveReportFallback } from "./report-fallback.js";
8
- import { extractUsageMetrics } from "../utils/usage-metrics.js";
9
-
10
/**
 * Extract the provider id from a model identifier of the form
 * "provider/model".
 *
 * @param {*} modelId - Model identifier; falsy values are treated as empty.
 * @returns {string|null} Everything before the first "/" (or the whole
 *   string when there is no "/"), or null when that prefix is empty.
 */
export function modelToProviderId(modelId) {
  const text = modelId ? String(modelId) : "";
  const slashAt = text.indexOf("/");
  const prefix = slashAt === -1 ? text : text.slice(0, slashAt);
  return prefix === "" ? null : prefix;
}
13
-
14
/**
 * Decide whether a provider failure looks transient, i.e. whether trying the
 * next provider in the failover chain is worthwhile.
 *
 * An error is retryable when its message or its `code` contains one of the
 * known network/timeout markers, or when its HTTP status is 429 or 5xx.
 *
 * @param {*} err - The thrown value. May be null/undefined or a non-Error.
 * @returns {boolean} true when the failure is considered retryable.
 */
export function isRetryableError(err) {
  // A thrown null/undefined carries no information; treat it as fatal
  // instead of crashing with a TypeError while classifying it.
  if (err == null) {
    return false;
  }

  const transientMarkers = [
    "econnrefused",
    "etimedout",
    "fetch failed",
    "net_error",
    "timeout",
    "enotfound",
    "eai_again"
  ];

  // `message` and `code` are not guaranteed to be strings on arbitrary
  // thrown values, so coerce before lower-casing.
  const message = String(err.message ?? "").toLowerCase();
  const code = String(err.code ?? "").toLowerCase();
  const looksTransient = transientMarkers.some(
    (marker) => message.includes(marker) || code.includes(marker)
  );
  if (looksTransient) {
    return true;
  }

  // Status codes sometimes arrive as strings (e.g. "429"); NaN fails both
  // comparisons below and therefore falls through to false.
  const statusCode = Number(err.statusCode || err.status || 0);
  return statusCode === 429 || (statusCode >= 500 && statusCode < 600);
}
36
-
37
/**
 * Compute the timeout (in milliseconds) to apply to a provider call.
 *
 * Precedence:
 *   1. `options.providerTimeoutMs`, when set and numeric, wins outright.
 *   2. Otherwise the larger of the provider's `defaultTimeoutMs` and a
 *      budget-derived timeout: (maxRuntimeSeconds + 5s grace), capped at 60s.
 *
 * Non-numeric inputs are treated as "not set" so the result is never NaN.
 *
 * @param {object|null} plan - Execution plan; reads `job.budget.maxRuntimeSeconds`.
 * @param {object|null} providerConfig - Provider config; reads `defaultTimeoutMs`.
 * @param {object|null} [options] - Call options; reads `providerTimeoutMs`.
 * @returns {number} Timeout in milliseconds (0 when nothing is configured).
 */
export function computeProviderTimeoutMs(plan, providerConfig, options = {}) {
  const BUDGET_GRACE_SECONDS = 5;
  const BUDGET_TIMEOUT_CAP_MS = 60000;

  // Number("abc") is NaN, and Math.max(NaN, x) is NaN; map NaN to 0 so a
  // malformed config value behaves like a missing one.
  const numberOrZero = (value) => {
    const parsed = Number(value || 0);
    return Number.isNaN(parsed) ? 0 : parsed;
  };

  const override = options?.providerTimeoutMs;
  if (override != null) {
    const overrideMs = Number(override);
    if (!Number.isNaN(overrideMs)) {
      return overrideMs;
    }
    // A non-numeric override falls through to the computed timeout.
  }

  const defaultTimeoutMs = numberOrZero(providerConfig?.defaultTimeoutMs);
  const budgetSeconds = numberOrZero(plan?.job?.budget?.maxRuntimeSeconds);
  const budgetTimeoutMs = budgetSeconds
    ? Math.min((budgetSeconds + BUDGET_GRACE_SECONDS) * 1000, BUDGET_TIMEOUT_CAP_MS)
    : 0;
  return Math.max(defaultTimeoutMs, budgetTimeoutMs);
}
47
-
48
/**
 * Assemble the routing decision for a plan, letting caller options override
 * what the plan's own routing section says.
 *
 * @param {object} plan - Execution plan; reads `job.modelLane` and the
 *   optional `routing` section.
 * @param {object} [options] - Reads `routeMode`, `laneOverride` and
 *   `modelOverride`.
 * @returns {{requestedLane: *, selectedLane: *, routeMode: *, matchedRule: *,
 *   reasons: *, modelOverride: *}} The routing decision. `reasons` is the
 *   plan's own array when one is present (not a copy).
 */
export function buildRoutingDecision(plan, options = {}) {
  const routing = plan.routing;
  const requestedLane = plan.job.modelLane;

  // Lane precedence: explicit override, then the plan's routing, then the
  // lane the job asked for.
  let selectedLane = requestedLane;
  if (options.laneOverride) {
    selectedLane = options.laneOverride;
  } else if (routing?.selectedLane) {
    selectedLane = routing.selectedLane;
  }

  // Route mode follows the same precedence, ending at "primary".
  let routeMode = "primary";
  if (options.routeMode) {
    routeMode = options.routeMode;
  } else if (routing?.routeMode) {
    routeMode = routing.routeMode;
  }

  const matchedRule = routing?.matchedRule ? routing.matchedRule : null;
  const reasons = routing?.reasons ? routing.reasons : [];
  const modelOverride = options.modelOverride ? options.modelOverride : null;

  return { requestedLane, selectedLane, routeMode, matchedRule, reasons, modelOverride };
}
60
-
61
/**
 * Return the output-token cap for the "ollama" provider when it runs in
 * "prompt_contract" structured-output mode, or null when no cap applies.
 *
 * The output contract format is checked first; the selected lane is only
 * consulted when the format has no dedicated cap.
 *
 * @param {object|null} plan - Reads `packet.layers.outputContract.format`.
 * @param {object} context
 * @param {string} context.providerId - Provider id of the attempt.
 * @param {object|null} context.providerCapabilities - Reads `structuredOutputMode`.
 * @param {object|null} context.routingDecision - Reads `selectedLane`.
 * @returns {number|null} The cap, or null.
 */
export function getLocalPromptContractOutputCap(plan, { providerId, providerCapabilities, routingDecision }) {
  const usesPromptContract =
    providerId === "ollama" &&
    providerCapabilities?.structuredOutputMode === "prompt_contract";
  if (!usesPromptContract) {
    return null;
  }

  switch (plan?.packet?.layers?.outputContract?.format) {
    case "bulleted_briefing":
      return 1500;
    case "structured_rollup":
      return 2000;
    default:
      break;
  }

  switch (routingDecision?.selectedLane) {
    case "local_cheap":
      return 400;
    case "local_report":
      return 1200;
    default:
      return null;
  }
}
73
-
74
/**
 * Build everything needed to call a provider once: the adapter, its
 * capabilities, the invocation payload and the preflight token check.
 *
 * @param {object} args
 * @param {object} args.plan - Execution plan; reads `job.id`,
 *   `job.budget.maxTokens`, `packet.layers.outputContract`, `packet.thinkMode`.
 * @param {object} args.runtimeConfig - Passed through to `buildPreflight`.
 * @param {object} args.registry - Must expose `create(providerConfig)`.
 * @param {object} [args.tokenCounter] - Passed through to `buildPreflight`.
 * @param {string} args.modelId - Model identifier placed on the invocation.
 * @param {object} args.providerConfig - Provider configuration (required).
 * @param {string} args.providerId - Provider id (e.g. "ollama", "anthropic").
 * @param {object} args.routingDecision - Used to pick a local output cap.
 * @param {number} args.providerTimeoutMs - Timeout placed on the invocation.
 * @param {Array} [args.toolSchemas] - Tool schemas; omitted from the
 *   invocation when empty.
 * @param {Function} args.buildSystemPrompt - `(plan, ctx) => system prompt`.
 * @param {Function} args.buildUserMessage - `(plan, ctx) => user content`.
 * @returns {Promise<{adapter: object, providerCapabilities: object|null,
 *   invocation: object, preflight: object}>}
 * @throws {Error} When `providerConfig` is missing, or when the preflight
 *   reports "hard" context pressure.
 */
export async function prepareProviderAttempt({
  plan,
  runtimeConfig,
  registry,
  tokenCounter,
  modelId,
  providerConfig,
  providerId,
  routingDecision,
  providerTimeoutMs,
  toolSchemas,
  buildSystemPrompt,
  buildUserMessage
}) {
  if (!providerConfig) {
    throw new Error(`No provider config for model ${modelId}`);
  }
  const adapter = registry.create(providerConfig);
  const providerCapabilities = adapter?.getCapabilities?.() || null;

  // Native structured output is used only when the plan has an output
  // contract AND the adapter says it supports it.
  const nativeStructuredOutput = Boolean(
    adapter &&
      plan.packet.layers.outputContract &&
      typeof adapter.supportsNativeStructuredOutput === "function" &&
      adapter.supportsNativeStructuredOutput()
  );
  const responseSchema = nativeStructuredOutput
    ? compileOutputContractSchema(plan.packet.layers.outputContract, {
        thoughtFirst: providerCapabilities?.supportsReasoningSchema === true
      })
    : null;

  const localPromptContractCap = getLocalPromptContractOutputCap(plan, {
    providerId,
    providerCapabilities,
    routingDecision
  });

  // With a local cap in force, the effective limit is the smaller of the
  // job budget and the cap. When the budget is unset (or not a positive
  // number) the cap itself is used: taking Math.min(0, cap) would send
  // maxTokens/num_predict of 0 to the provider.
  let effectiveMaxTokens = plan.job.budget.maxTokens;
  if (localPromptContractCap) {
    const budgetMaxTokens = Number(plan.job.budget.maxTokens || 0) || 0;
    effectiveMaxTokens =
      budgetMaxTokens > 0
        ? Math.min(budgetMaxTokens, localPromptContractCap)
        : localPromptContractCap;
  }

  const invocation = {
    model: modelId,
    system: buildSystemPrompt(plan, {
      nativeStructuredOutput,
      responseSchema,
      toolSchemas
    }),
    messages: [
      {
        role: "user",
        content: buildUserMessage(plan, {
          nativeStructuredOutput,
          responseSchema
        })
      }
    ],
    maxTokens: effectiveMaxTokens,
    responseSchema,
    timeoutMs: providerTimeoutMs,
    tools: toolSchemas?.length ? toolSchemas : undefined,
    // Only the ollama provider receives an `options` object.
    options:
      providerId === "ollama"
        ? {
            num_predict: effectiveMaxTokens
          }
        : undefined
  };

  // Extended thinking is opt-in: it needs a non-"off" think mode on the
  // packet, the anthropic provider, and the env flag set to "true".
  const thinkMode = plan?.packet?.thinkMode;
  if (
    thinkMode &&
    thinkMode !== "off" &&
    providerId === "anthropic" &&
    process.env.ANTHROPIC_THINKING_ENABLED === "true"
  ) {
    const THINK_BUDGETS = { low: 1000, medium: 8000, high: 16000 };
    const budget = THINK_BUDGETS[thinkMode] || 8000;
    invocation.betas = [...(invocation.betas || []), "interleaved-thinking-2025-05-14"];
    invocation.thinking = { type: "enabled", budget_tokens: budget };
  }

  const preflight = await buildPreflight(runtimeConfig, invocation, {
    providerId,
    adapter,
    tokenCounter
  });

  if (preflight.pressure === "hard") {
    throw new Error(
      `Preflight blocked ${plan.job.id}: estimated prompt tokens ${preflight.estimatedPromptTokens} exceed hard limit ${preflight.hardLimit}`
    );
  }

  return {
    adapter,
    providerCapabilities,
    invocation,
    preflight
  };
}
173
-
174
/**
 * Estimate the prompt size of an invocation and classify it against the
 * configured context-pressure thresholds.
 *
 * Settings are read from `runtimeConfig.safety`, with these defaults:
 * contextTokens 32768, soft ratio 0.72, hard ratio 0.9,
 * freshSessionOnHighPressure true, snapshotBeforeCompaction true.
 *
 * @param {object|null} runtimeConfig - Runtime config holding `safety`.
 * @param {object} invocation - The invocation whose tokens are counted.
 * @param {object} [options] - Reads `tokenCounter` (a new TokenCounter is
 *   created when absent), `providerId` and `adapter`.
 * @returns {Promise<object>} Limits, estimates and the `pressure` level:
 *   "hard" at or above the hard limit, "high" at or above the soft limit,
 *   otherwise "low".
 */
export async function buildPreflight(runtimeConfig, invocation, options = {}) {
  const safety = runtimeConfig?.safety;
  const contextTokens = safety?.contextTokens ?? 32768;
  const softRatio = safety?.contextPressureSoftRatio ?? 0.72;
  const hardRatio = safety?.contextPressureHardRatio ?? 0.9;
  const freshSessionOnHighPressure = safety?.freshSessionOnHighPressure ?? true;
  const snapshotBeforeCompaction = safety?.snapshotBeforeCompaction ?? true;

  const counter = options.tokenCounter ? options.tokenCounter : new TokenCounter();
  const tokenEstimate = await counter.countInvocation({
    providerId: options.providerId,
    invocation,
    adapter: options.adapter
  });

  // Reuse the counter's details when it already ran heuristically;
  // otherwise compute a separate heuristic estimate alongside it.
  let heuristicEstimate;
  if (tokenEstimate.mode === "heuristic") {
    heuristicEstimate = tokenEstimate.details;
  } else {
    heuristicEstimate = estimateInvocationTokens(invocation);
  }

  const estimatedPromptTokens = tokenEstimate.total;
  const [softLimit, hardLimit] = [softRatio, hardRatio].map((ratio) =>
    Math.floor(contextTokens * ratio)
  );

  const pressure =
    estimatedPromptTokens >= hardLimit
      ? "hard"
      : estimatedPromptTokens >= softLimit
        ? "high"
        : "low";

  return {
    contextTokens,
    estimatedPromptTokens,
    tokenEstimate,
    heuristicEstimate,
    softLimit,
    hardLimit,
    pressure,
    freshSessionRequired: pressure !== "low" && freshSessionOnHighPressure,
    snapshotBeforeCompaction
  };
}
207
-
208
/**
 * Attach the plan's image references to the last user message of an
 * invocation, or, when the provider has no vision support, add a note
 * telling the model that an image was received.
 *
 * The invocation is mutated in place and also returned.
 *
 * @param {object} plan - Reads `packet.imageRefs` (each with a `fileId`).
 * @param {object|null} runtimeConfig - Reads `telegram.botTokenEnv`, the
 *   name of the environment variable holding the bot token.
 * @param {object|null} invocation - Invocation whose `messages` are updated.
 * @param {object|null} providerCapabilities - Reads `supportsVision`.
 * @returns {Promise<object|null>} The same invocation object.
 */
async function attachVisionInputs(plan, runtimeConfig, invocation, providerCapabilities) {
  if (!plan.packet?.imageRefs?.length || !invocation) {
    return invocation;
  }

  if (providerCapabilities?.supportsVision) {
    const tgConfig = runtimeConfig?.telegram;
    const botToken = tgConfig?.botTokenEnv ? process.env[tgConfig.botTokenEnv] : null;
    if (!botToken) {
      console.warn(`[executor] imageRefs present but botToken not resolved from ${tgConfig?.botTokenEnv || "undefined env key"}`);
      return invocation;
    }

    const imageBlocks = [];
    for (const ref of plan.packet.imageRefs) {
      const downloaded = await downloadTelegramFile(ref.fileId, botToken);
      // A falsy download result is skipped rather than treated as an error.
      if (downloaded) {
        imageBlocks.push({
          type: "image",
          source: {
            type: "base64",
            media_type: downloaded.mediaType,
            data: downloaded.base64
          }
        });
      }
    }

    if (imageBlocks.length > 0) {
      const userIdx = invocation.messages.findLastIndex((message) => message.role === "user");
      if (userIdx !== -1) {
        const existing = invocation.messages[userIdx].content;
        let trailingBlocks = [];
        if (Array.isArray(existing)) {
          // Content already in block form: keep the blocks as they are
          // instead of nesting the array inside a text block.
          trailingBlocks = existing;
        } else if (existing) {
          trailingBlocks = [{ type: "text", text: existing }];
        }
        // Empty or missing text yields no text block at all.
        // NOTE(review): presumably providers reject empty text blocks — confirm.
        invocation.messages[userIdx].content = [...imageBlocks, ...trailingBlocks];
      }
    }
    return invocation;
  }

  const visionNote = "[Image received but this model doesn't support vision]";
  const userIdx = invocation.messages.findLastIndex((message) => message.role === "user");
  if (userIdx !== -1) {
    const existing = invocation.messages[userIdx].content;
    if (Array.isArray(existing)) {
      // Interpolating an array of blocks into a string would produce
      // "[object Object]"; append the note as its own text block instead.
      invocation.messages[userIdx].content = [...existing, { type: "text", text: visionNote }];
    } else {
      invocation.messages[userIdx].content = existing
        ? `${existing}\n\n${visionNote}`
        : visionNote;
    }
  }
  return invocation;
}
259
-
260
/**
 * Copy attempt metadata onto an error object so callers can inspect which
 * provider/model/routing the failure belongs to.
 *
 * @param {*} error - The value to annotate. Non-objects (including null)
 *   are returned untouched.
 * @param {object} [metadata] - Properties to copy onto the error.
 * @returns {*} The same `error` value that was passed in.
 */
function annotateAttemptError(error, metadata = {}) {
  const canAnnotate = error !== null && typeof error === "object";
  return canAnnotate ? Object.assign(error, metadata) : error;
}
268
-
269
/**
 * Run a single provider attempt: prepare the invocation, attach vision
 * inputs, then either stop (dry-run) or health-check and invoke the adapter.
 *
 * Any failure is rethrown after being annotated with the provider, model,
 * routing decision and whatever was prepared before the failure.
 *
 * @param {object} args - Attempt inputs; all preparation fields are
 *   forwarded to `prepareProviderAttempt`.
 * @param {string} args.mode - "dry-run" returns without calling the adapter.
 * @param {Function} [args.onPrepared] - Called with the prepared attempt
 *   right after preparation succeeds.
 * @returns {Promise<object>} Attempt result (response, usage, adapter,
 *   invocation, preflight, policy, health, toolLoopEnabled, ...).
 */
async function executeProviderCall({
  plan,
  runtime,
  mode,
  registry,
  tokenCounter,
  modelId,
  providerId,
  providerConfig,
  routingDecision,
  providerTimeoutMs,
  toolSchemas,
  buildSystemPrompt,
  buildUserMessage,
  onPrepared
}) {
  // Declared outside the try so the catch can report partial progress.
  let prepared = null;
  let invocation = null;

  try {
    prepared = await prepareProviderAttempt({
      plan,
      runtimeConfig: runtime.runtime,
      registry,
      tokenCounter,
      modelId,
      providerConfig,
      providerId,
      routingDecision,
      providerTimeoutMs,
      toolSchemas,
      buildSystemPrompt,
      buildUserMessage
    });

    if (typeof onPrepared === "function") {
      onPrepared(prepared);
    }

    invocation = await attachVisionInputs(
      plan,
      runtime.runtime,
      prepared.invocation,
      prepared.providerCapabilities
    );

    // Both exits share the same result shape; only the outcome differs.
    const describeAttempt = (outcome) => ({
      response: outcome.response,
      providerId,
      modelId,
      usage: outcome.usage,
      cached: outcome.cached,
      adapter: prepared.adapter,
      providerCapabilities: prepared.providerCapabilities,
      invocation,
      preflight: prepared.preflight,
      providerModePolicy: outcome.providerModePolicy,
      health: outcome.health,
      toolLoopEnabled: outcome.toolLoopEnabled
    });

    if (mode === "dry-run") {
      // Dry runs never reach the policy check, health check or adapter.
      return describeAttempt({
        response: null,
        usage: {
          tokensIn: 0,
          tokensOut: 0,
          cacheIn: 0,
          cacheCreation: 0
        },
        cached: false,
        providerModePolicy: null,
        health: null,
        toolLoopEnabled: false
      });
    }

    const providerModePolicy = assertProviderExecutionAllowed({
      jobId: plan.job.id,
      modelLane: routingDecision.selectedLane,
      providerId,
      interactive: plan.job.trigger === "interactive"
    });

    let health = null;
    if (providerModePolicy.requireHealthyProvider) {
      const probe = await prepared.adapter.healthCheck();
      if (!probe.ok) {
        throw new Error(`Provider health check failed for ${providerId} with status ${probe.status}`);
      }
      health = probe;
    }

    const response = await prepared.adapter.invoke(invocation);
    const usage = extractUsageMetrics(response);

    return describeAttempt({
      response,
      usage,
      cached: Boolean(usage.cacheIn || usage.cacheCreation),
      providerModePolicy,
      health,
      toolLoopEnabled: true
    });
  } catch (error) {
    throw annotateAttemptError(error, {
      providerId,
      modelId,
      routingDecision,
      providerCapabilities: prepared?.providerCapabilities || null,
      invocation: invocation || prepared?.invocation || null,
      preflight: prepared?.preflight || null
    });
  }
}
381
-
382
/**
 * Create the initial fallback bookkeeping record for an attempt: nothing
 * allowed or attempted yet, with the source lane/provider/model recorded and
 * the report-fallback policy resolved from the runtime config.
 *
 * @param {object} runtimeConfig - Passed to `getReportFallbackPolicy`.
 * @param {object} routingDecision - Reads `selectedLane`.
 * @param {string|null} providerId - Provider of the source attempt.
 * @param {string} modelId - Model of the source attempt.
 * @param {object} options - Passed to `getReportFallbackPolicy`.
 * @returns {object} The initial fallback state.
 */
function buildFallbackState(runtimeConfig, routingDecision, providerId, modelId, options) {
  const sourceLane = routingDecision.selectedLane;
  const policy = getReportFallbackPolicy(runtimeConfig, options);

  return {
    allowed: false,
    attempted: false,
    trigger: null,
    // Starts out equal to the source lane.
    finalSourceLane: sourceLane,
    sourceLane,
    sourceProviderId: providerId,
    sourceModelId: modelId,
    policy
  };
}
394
-
395
/**
 * Execute a plan against its provider chain, then against the report
 * fallback lane if the chain fails and fallback is allowed.
 *
 * Phase 1 — failover chain: the primary model (option override, packet
 * override, or router resolution) followed by the lane's `fallbackModels`.
 * Models whose circuit breaker is open are skipped. A retryable failure
 * moves on to the next model; a non-retryable failure ends the chain.
 *
 * Phase 2 — report fallback: the last failure is classified and
 * `resolveReportFallback` decides whether another lane may be tried. If
 * not, the last error is thrown, annotated with the fallback state.
 *
 * @param {object} args
 * @param {object} args.plan - Execution plan (`job`, `packet`, `routing`).
 * @param {object} args.runtime - Reads `router`, `providers`, `runtime`.
 * @param {object} [args.options] - Reads `mode` (default "dry-run"),
 *   `router`, `modelOverride`, `toolSchemas`, `registry`, `tokenCounter`,
 *   `buildSystemPrompt`, `buildUserMessage`, `getBreaker`,
 *   `allowToolLoopOnFallback`, plus whatever the routing, timeout and
 *   fallback helpers read.
 * @returns {Promise<object>} The successful attempt, with `routingDecision`,
 *   `fallback` and `primaryModelId` attached.
 * @throws {Error} The last chain error when fallback is not allowed, or a
 *   combined error when the fallback attempt fails too.
 */
export async function attemptProvider({ plan, runtime, options = {} }) {
  const mode = options.mode || "dry-run";
  const router = options.router || new ModelRouter(runtime.router);
  const routingDecision = buildRoutingDecision(plan, options);
  const laneConfig = runtime.router?.[routingDecision.selectedLane];
  const primaryModelId = options.modelOverride || plan.packet.modelOverride || router.resolve(routingDecision.selectedLane, routingDecision.routeMode);
  const providersToTry = [primaryModelId, ...(laneConfig?.fallbackModels || [])];
  const toolSchemas = options.toolSchemas || [];
  const registry = options.registry;
  const tokenCounter = options.tokenCounter;
  const buildSystemPrompt = options.buildSystemPrompt;
  const buildUserMessage = options.buildUserMessage;

  let fallback = null;
  // Despite the name, this holds the most recent failure in the chain.
  let primaryError = null;
  let lastProviderId = null;

  for (const currentModelId of providersToTry) {
    const currentProviderId = modelToProviderId(currentModelId);
    // Optional chaining: with no providers table the attempt fails with the
    // intended "No provider config" error instead of a TypeError here.
    const providerConfig = runtime.providers?.[currentProviderId];
    const providerTimeoutMs = computeProviderTimeoutMs(plan, providerConfig, options);
    const breaker = options.getBreaker?.(currentModelId, runtime.runtime) || null;
    lastProviderId = currentProviderId;

    if (breaker?.isOpen()) {
      const retryAfter = breaker.retryAfter();
      console.warn(`[Nemoris] circuit breaker open for ${currentModelId}, skipping (retry in ${Math.ceil(retryAfter)}s)`);
      primaryError = new Error(`Provider ${currentModelId} circuit open — retry after ${Math.ceil(retryAfter)}s`);
      annotateAttemptError(primaryError, {
        providerId: currentProviderId,
        modelId: currentModelId,
        routingDecision,
        fallback
      });
      continue;
    }

    try {
      const attempt = await executeProviderCall({
        plan,
        runtime,
        mode,
        registry,
        tokenCounter,
        modelId: currentModelId,
        providerId: currentProviderId,
        providerConfig,
        routingDecision,
        providerTimeoutMs,
        toolSchemas,
        buildSystemPrompt,
        buildUserMessage,
        // Fallback state is created once, for the first model that gets as
        // far as a prepared invocation.
        onPrepared: () => {
          if (!fallback) {
            fallback = buildFallbackState(runtime.runtime, routingDecision, currentProviderId, currentModelId, options);
          }
        }
      });

      if (mode === "provider") {
        breaker?.recordSuccess();
      }

      return {
        ...attempt,
        routingDecision,
        fallback,
        primaryModelId
      };
    } catch (err) {
      primaryError = annotateAttemptError(err, {
        providerId: currentProviderId,
        modelId: currentModelId,
        routingDecision,
        fallback
      });
      // `err` may be any thrown value; guard the property reads so a thrown
      // null/undefined does not raise a TypeError inside the handler.
      const statusCode = err?.statusCode || err?.status || 0;
      breaker?.recordFailure(statusCode);

      if (err != null && isRetryableError(err)) {
        console.warn(`[executor] provider ${currentModelId} failed: ${err.message}, trying next`);
        continue;
      }
      break;
    }
  }

  if (!primaryError) {
    primaryError = new Error("All providers in failover chain exhausted");
    annotateAttemptError(primaryError, {
      routingDecision,
      fallback
    });
  }

  const failureClass = classifyRuntimeFailure(primaryError?.message || "");
  const fallbackResolution = resolveReportFallback({
    runtimeConfig: runtime.runtime,
    job: plan.job,
    routingDecision,
    providerId: lastProviderId,
    failureClass,
    options
  });

  fallback = {
    ...(fallback || {}),
    allowed: fallbackResolution.allowed,
    attempted: false,
    trigger: failureClass,
    localFailureClass: failureClass,
    localError: primaryError.message,
    blockedReason: fallbackResolution.allowed ? null : fallbackResolution.reason,
    targetLane: fallbackResolution.targetLane || null
  };

  if (!fallbackResolution.allowed) {
    annotateAttemptError(primaryError, {
      providerId: primaryError.providerId || lastProviderId,
      routingDecision,
      fallback
    });
    throw primaryError;
  }

  fallback.attempted = true;
  const fallbackRoutingDecision = {
    ...routingDecision,
    selectedLane: fallbackResolution.targetLane,
    routeMode: "fallback",
    reasons: [...(routingDecision.reasons || []), `fallback:${failureClass}`],
    description: "Failure-triggered report fallback."
  };
  const fallbackModelId = router.resolve(fallbackResolution.targetLane, "primary");
  const fallbackProviderId = modelToProviderId(fallbackModelId);
  const fallbackProviderConfig = runtime.providers?.[fallbackProviderId];

  try {
    const attempt = await executeProviderCall({
      plan,
      runtime,
      mode,
      registry,
      tokenCounter,
      modelId: fallbackModelId,
      providerId: fallbackProviderId,
      providerConfig: fallbackProviderConfig,
      routingDecision: fallbackRoutingDecision,
      providerTimeoutMs: computeProviderTimeoutMs(plan, fallbackProviderConfig, options),
      toolSchemas,
      buildSystemPrompt,
      buildUserMessage
    });

    return {
      ...attempt,
      routingDecision: fallbackRoutingDecision,
      fallback: {
        ...fallback,
        success: true,
        finalSourceLane: fallbackRoutingDecision.selectedLane,
        finalProviderId: fallbackProviderId,
        finalModelId: fallbackModelId
      },
      // Same field the primary-path result carries, so both success shapes
      // expose which model was originally requested.
      primaryModelId,
      // The tool loop stays off after a fallback unless explicitly enabled.
      toolLoopEnabled: mode === "provider" && Boolean(options.allowToolLoopOnFallback)
    };
  } catch (fallbackError) {
    fallback = {
      ...fallback,
      success: false,
      fallbackFailureClass: classifyRuntimeFailure(fallbackError?.message || ""),
      fallbackError: fallbackError?.message
    };
    const combinedError = new Error(
      `Primary provider failed (${failureClass}) and fallback failed: ${fallbackError?.message}`
    );
    annotateAttemptError(combinedError, {
      providerId: fallbackProviderId,
      modelId: fallbackModelId,
      routingDecision: fallbackRoutingDecision,
      providerCapabilities: fallbackError?.providerCapabilities || null,
      invocation: fallbackError?.invocation || null,
      preflight: fallbackError?.preflight || null,
      fallback
    });
    throw combinedError;
  }
}
1
+ import { downloadTelegramFile } from "./telegram-inbound.js";
2
+ import { ModelRouter } from "../providers/router.js";
3
+ import { assertProviderExecutionAllowed } from "./guards.js";
4
+ import { compileOutputContractSchema } from "./output-contract-schema.js";
5
+ import { estimateInvocationTokens } from "./token-estimator.js";
6
+ import { TokenCounter } from "./token-counter.js";
7
+ import { classifyRuntimeFailure, getReportFallbackPolicy, resolveReportFallback } from "./report-fallback.js";
8
+ import { extractUsageMetrics } from "../utils/usage-metrics.js";
9
+
10
/**
 * Extracts the provider prefix from a model identifier.
 *
 * @param {*} modelId - Identifier such as "provider/model"; falsy values are treated as "".
 * @returns {string|null} The text before the first "/", or null when that text is empty.
 */
export function modelToProviderId(modelId) {
  const [providerPrefix] = String(modelId || "").split("/");
  return providerPrefix || null;
}
13
+
14
/**
 * Decides whether a provider failure is worth retrying on the next provider.
 *
 * An error is retryable when its message contains one of the known
 * network/timeout markers (case-insensitive), or when its HTTP status is 429
 * or in the 5xx range.
 *
 * Tolerates a null/undefined error, a non-string `message`, and a status given
 * as a numeric string (e.g. "503"); none of these throw.
 *
 * @param {*} err - The thrown value; `message`, `statusCode` and `status` are read if present.
 * @returns {boolean} True when the failure looks transient.
 */
export function isRetryableError(err) {
  const transientMarkers = [
    "econnrefused",
    "etimedout",
    "fetch failed",
    "net_error",
    "timeout",
    "enotfound",
    "eai_again"
  ];

  // String() guards against non-string messages; `|| ""` keeps falsy values out.
  const message = String(err?.message || "").toLowerCase();
  if (transientMarkers.some((marker) => message.includes(marker))) {
    return true;
  }

  // Number() lets "429"/"503" behave like their numeric forms; NaN fails both checks.
  const statusCode = Number(err?.statusCode || err?.status || 0);
  return statusCode === 429 || (statusCode >= 500 && statusCode < 600);
}
36
+
37
/**
 * Picks the timeout (in milliseconds) for a provider call.
 *
 * An explicit `options.providerTimeoutMs` (anything other than null/undefined)
 * wins and is returned as a Number. Otherwise the result is the larger of the
 * provider's `defaultTimeoutMs` and a budget-derived timeout of
 * `(maxRuntimeSeconds + 5)` seconds, capped at 60000 ms.
 *
 * @param {object} plan - Plan whose `job.budget.maxRuntimeSeconds` is consulted.
 * @param {object} providerConfig - Provider config whose `defaultTimeoutMs` is consulted.
 * @param {object} [options] - May carry `providerTimeoutMs`.
 * @returns {number} Timeout in milliseconds.
 */
export function computeProviderTimeoutMs(plan, providerConfig, options = {}) {
  const explicitTimeout = options.providerTimeoutMs;
  if (explicitTimeout != null) {
    return Number(explicitTimeout);
  }

  const configuredMs = Number(providerConfig?.defaultTimeoutMs || 0);
  const runtimeSeconds = Number(plan?.job?.budget?.maxRuntimeSeconds || 0);

  let budgetMs = 0;
  if (runtimeSeconds) {
    // Five seconds of slack on top of the job budget, never more than a minute.
    budgetMs = Math.min((runtimeSeconds + 5) * 1000, 60000);
  }

  return Math.max(configuredMs, budgetMs);
}
47
+
48
/**
 * Assembles the routing decision record for a plan.
 *
 * Caller overrides in `options` take precedence over `plan.routing`, which in
 * turn takes precedence over the defaults (the job's own lane and the
 * "primary" route mode).
 *
 * @param {object} plan - Must provide `job.modelLane`; `routing` is optional.
 * @param {object} [options] - May carry `routeMode`, `laneOverride`, `modelOverride`.
 * @returns {object} Record with requestedLane, selectedLane, routeMode,
 *   matchedRule, reasons and modelOverride.
 */
export function buildRoutingDecision(plan, options = {}) {
  const routing = plan.routing;
  const requestedLane = plan.job.modelLane;

  return {
    requestedLane,
    selectedLane: options.laneOverride || routing?.selectedLane || requestedLane,
    routeMode: options.routeMode || routing?.routeMode || "primary",
    matchedRule: routing?.matchedRule || null,
    reasons: routing?.reasons || [],
    modelOverride: options.modelOverride || null
  };
}
60
+
61
/**
 * Returns an output-token cap for Ollama runs that use prompt-contract
 * structured output, or null when no cap applies.
 *
 * The output contract format is checked first; the selected lane is only
 * consulted when the format has no dedicated cap.
 *
 * @param {object} plan - Plan whose `packet.layers.outputContract.format` is consulted.
 * @param {object} context
 * @param {string} context.providerId - Only "ollama" is capped.
 * @param {object} context.providerCapabilities - Only `structuredOutputMode === "prompt_contract"` is capped.
 * @param {object} context.routingDecision - Its `selectedLane` is the fallback selector.
 * @returns {number|null} Token cap, or null.
 */
export function getLocalPromptContractOutputCap(plan, { providerId, providerCapabilities, routingDecision }) {
  const usesLocalPromptContract =
    providerId === "ollama" && providerCapabilities?.structuredOutputMode === "prompt_contract";
  if (!usesLocalPromptContract) {
    return null;
  }

  switch (plan?.packet?.layers?.outputContract?.format || null) {
    case "bulleted_briefing":
      return 1500;
    case "structured_rollup":
      return 2000;
    default:
      break;
  }

  switch (routingDecision?.selectedLane) {
    case "local_cheap":
      return 400;
    case "local_report":
      return 1200;
    default:
      return null;
  }
}
73
+
74
/**
 * Builds everything needed for one provider attempt: the adapter, its
 * capabilities, the invocation payload, and the preflight token check.
 *
 * @param {object} params
 * @param {object} params.plan - Reads `packet.layers.outputContract`, `packet.thinkMode`,
 *   `job.budget.maxTokens` and `job.id`.
 * @param {object} params.runtimeConfig - Passed to `buildPreflight`.
 * @param {object} params.registry - `registry.create(providerConfig)` yields the adapter.
 * @param {object} [params.tokenCounter] - Passed to `buildPreflight`.
 * @param {string} params.modelId - Model sent in the invocation.
 * @param {object} params.providerConfig - Required; a missing config throws.
 * @param {string} params.providerId - Selects provider-specific invocation options.
 * @param {object} params.routingDecision - Used when deriving the local output cap.
 * @param {number} params.providerTimeoutMs - Copied to `invocation.timeoutMs`.
 * @param {Array} [params.toolSchemas] - Sent as `tools` when non-empty.
 * @param {Function} params.buildSystemPrompt - Produces the system prompt.
 * @param {Function} params.buildUserMessage - Produces the user message content.
 * @returns {Promise<{adapter: object, providerCapabilities: (object|null), invocation: object, preflight: object}>}
 * @throws {Error} When `providerConfig` is missing, or when preflight reports "hard" pressure.
 */
export async function prepareProviderAttempt({
  plan,
  runtimeConfig,
  registry,
  tokenCounter,
  modelId,
  providerConfig,
  providerId,
  routingDecision,
  providerTimeoutMs,
  toolSchemas,
  buildSystemPrompt,
  buildUserMessage
}) {
  if (!providerConfig) {
    throw new Error(`No provider config for model ${modelId}`);
  }
  const adapter = registry.create(providerConfig);
  const providerCapabilities = adapter?.getCapabilities?.() || null;
  const nativeStructuredOutput = Boolean(
    adapter &&
    plan.packet.layers.outputContract &&
    typeof adapter.supportsNativeStructuredOutput === "function" &&
    adapter.supportsNativeStructuredOutput()
  );
  // A response schema is only compiled when the adapter enforces it natively.
  const responseSchema = nativeStructuredOutput
    ? compileOutputContractSchema(plan.packet.layers.outputContract, {
        thoughtFirst: providerCapabilities?.supportsReasoningSchema === true
      })
    : null;

  const localPromptContractCap = getLocalPromptContractOutputCap(plan, {
    providerId,
    providerCapabilities,
    routingDecision
  });

  // When a local cap applies, take the smaller of budget and cap. A missing or
  // non-positive budget must not win the Math.min (that would request 0 output
  // tokens), so the cap alone is used in that case.
  const budgetMaxTokens = plan.job.budget.maxTokens;
  const numericBudget = Number(budgetMaxTokens || 0) || 0;
  let effectiveMaxTokens = budgetMaxTokens;
  if (localPromptContractCap) {
    effectiveMaxTokens = numericBudget > 0
      ? Math.min(numericBudget, localPromptContractCap)
      : localPromptContractCap;
  }

  const invocation = {
    model: modelId,
    system: buildSystemPrompt(plan, {
      nativeStructuredOutput,
      responseSchema,
      toolSchemas
    }),
    messages: [
      {
        role: "user",
        content: buildUserMessage(plan, {
          nativeStructuredOutput,
          responseSchema
        })
      }
    ],
    maxTokens: effectiveMaxTokens,
    responseSchema,
    timeoutMs: providerTimeoutMs,
    tools: toolSchemas?.length ? toolSchemas : undefined,
    options:
      providerId === "ollama"
        ? {
            num_predict: effectiveMaxTokens
          }
        : undefined
  };

  // Extended thinking is opt-in: the plan must request it, the provider must be
  // Anthropic, and the environment flag must be set.
  const thinkMode = plan?.packet?.thinkMode;
  if (
    thinkMode && thinkMode !== "off" &&
    providerId === "anthropic" &&
    process.env.ANTHROPIC_THINKING_ENABLED === "true"
  ) {
    const THINK_BUDGETS = { low: 1000, medium: 8000, high: 16000 };
    const budget = THINK_BUDGETS[thinkMode] || 8000;
    invocation.betas = [...(invocation.betas || []), "interleaved-thinking-2025-05-14"];
    invocation.thinking = { type: "enabled", budget_tokens: budget };
  }

  const preflight = await buildPreflight(runtimeConfig, invocation, {
    providerId,
    adapter,
    tokenCounter
  });

  if (preflight.pressure === "hard") {
    throw new Error(
      `Preflight blocked ${plan.job.id}: estimated prompt tokens ${preflight.estimatedPromptTokens} exceed hard limit ${preflight.hardLimit}`
    );
  }

  return {
    adapter,
    providerCapabilities,
    invocation,
    preflight
  };
}
173
+
174
/**
 * Estimates the prompt size of an invocation and classifies context pressure.
 *
 * Limits come from `runtimeConfig.safety`, with defaults of a 32768-token
 * context, a 0.72 soft ratio and a 0.9 hard ratio. Pressure is "hard" at or
 * above the hard limit, "high" at or above the soft limit, otherwise "low".
 *
 * @param {object} runtimeConfig - Optional `safety` section supplies the limits and flags.
 * @param {object} invocation - The invocation whose tokens are counted.
 * @param {object} [options] - May carry `tokenCounter`, `providerId`, `adapter`.
 * @returns {Promise<object>} Limits, estimates, pressure level, and session/snapshot flags.
 */
export async function buildPreflight(runtimeConfig, invocation, options = {}) {
  const safety = runtimeConfig?.safety;
  const contextTokens = safety?.contextTokens ?? 32768;
  const softRatio = safety?.contextPressureSoftRatio ?? 0.72;
  const hardRatio = safety?.contextPressureHardRatio ?? 0.9;
  const freshSessionOnHighPressure = safety?.freshSessionOnHighPressure ?? true;
  const snapshotBeforeCompaction = safety?.snapshotBeforeCompaction ?? true;

  const counter = options.tokenCounter || new TokenCounter();
  const tokenEstimate = await counter.countInvocation({
    providerId: options.providerId,
    invocation,
    adapter: options.adapter
  });

  // Reuse the counter's own details when it already ran heuristically;
  // otherwise compute a heuristic estimate alongside the counter's result.
  let heuristicEstimate;
  if (tokenEstimate.mode === "heuristic") {
    heuristicEstimate = tokenEstimate.details;
  } else {
    heuristicEstimate = estimateInvocationTokens(invocation);
  }

  const estimatedPromptTokens = tokenEstimate.total;
  const softLimit = Math.floor(contextTokens * softRatio);
  const hardLimit = Math.floor(contextTokens * hardRatio);

  const pressure =
    estimatedPromptTokens >= hardLimit
      ? "hard"
      : estimatedPromptTokens >= softLimit
        ? "high"
        : "low";

  return {
    contextTokens,
    estimatedPromptTokens,
    tokenEstimate,
    heuristicEstimate,
    softLimit,
    hardLimit,
    pressure,
    freshSessionRequired: pressure !== "low" && freshSessionOnHighPressure,
    snapshotBeforeCompaction
  };
}
207
+
208
/**
 * Adds image inputs from `plan.packet.imageRefs` to the last user message of
 * an invocation, mutating and returning that invocation.
 *
 * - No image refs (or no invocation): returned untouched.
 * - Provider without vision support: a text note is appended to the last user message.
 * - Provider with vision support: each ref is downloaded via
 *   `downloadTelegramFile` and the last user message content becomes an array
 *   of image blocks followed by the original text. If the bot token cannot be
 *   resolved from the environment, a warning is logged and nothing is attached.
 *
 * @param {object} plan - Reads `packet.imageRefs` (each with a `fileId`).
 * @param {object} runtimeConfig - Reads `telegram.botTokenEnv` (name of the env var holding the token).
 * @param {object} invocation - Invocation whose `messages` may be modified in place.
 * @param {object} providerCapabilities - Reads `supportsVision`.
 * @returns {Promise<object>} The same invocation object.
 */
async function attachVisionInputs(plan, runtimeConfig, invocation, providerCapabilities) {
  const imageRefs = plan.packet?.imageRefs;
  if (!imageRefs?.length || !invocation) {
    return invocation;
  }

  const findLastUserIndex = () =>
    invocation.messages.findLastIndex((message) => message.role === "user");

  if (!providerCapabilities?.supportsVision) {
    const visionNote = "[Image received but this model doesn't support vision]";
    const noteIdx = findLastUserIndex();
    if (noteIdx !== -1) {
      const target = invocation.messages[noteIdx];
      const existing = target.content;
      target.content = existing ? `${existing}\n\n${visionNote}` : visionNote;
    }
    return invocation;
  }

  const tgConfig = runtimeConfig?.telegram;
  const botToken = tgConfig?.botTokenEnv ? process.env[tgConfig.botTokenEnv] : null;
  if (!botToken) {
    console.warn(`[executor] imageRefs present but botToken not resolved from ${tgConfig?.botTokenEnv || "undefined env key"}`);
    return invocation;
  }

  // Downloads run one at a time, in ref order; refs that fail to download are skipped.
  const imageBlocks = [];
  for (const ref of imageRefs) {
    const downloaded = await downloadTelegramFile(ref.fileId, botToken);
    if (!downloaded) {
      continue;
    }
    imageBlocks.push({
      type: "image",
      source: {
        type: "base64",
        media_type: downloaded.mediaType,
        data: downloaded.base64,
      },
    });
  }

  if (imageBlocks.length === 0) {
    return invocation;
  }

  const userIdx = findLastUserIndex();
  if (userIdx !== -1) {
    const target = invocation.messages[userIdx];
    const textContent = target.content;
    target.content = [
      ...imageBlocks,
      { type: "text", text: textContent },
    ];
  }
  return invocation;
}
259
+
260
/**
 * Copies attempt metadata onto an error object in place.
 *
 * Values that are falsy or not of type "object" (strings, numbers, functions,
 * null) are returned unchanged.
 *
 * @param {*} error - The thrown value to annotate.
 * @param {object} [metadata] - Properties to assign onto the error.
 * @returns {*} The same `error` value that was passed in.
 */
function annotateAttemptError(error, metadata = {}) {
  const isAnnotatable = Boolean(error) && typeof error === "object";
  return isAnnotatable ? Object.assign(error, metadata) : error;
}
268
+
269
/**
 * Runs one attempt against one provider.
 *
 * Steps: prepare the attempt, notify `onPrepared`, attach vision inputs, then
 * either stop (dry-run) or check the execution policy, optionally health-check
 * the adapter, and invoke it. Any error thrown along the way is annotated with
 * the attempt's provider/model/routing details (plus whatever had been
 * prepared so far) and rethrown.
 *
 * @param {object} params
 * @param {object} params.plan - The execution plan.
 * @param {object} params.runtime - Its `runtime` property is used as the runtime config.
 * @param {string} params.mode - "dry-run" skips the provider call entirely.
 * @param {Function} [params.onPrepared] - Called with the prepared attempt before vision inputs are attached.
 * @returns {Promise<object>} Attempt result: response, usage, adapter, invocation, preflight, policy and health.
 */
async function executeProviderCall({
  plan,
  runtime,
  mode,
  registry,
  tokenCounter,
  modelId,
  providerId,
  providerConfig,
  routingDecision,
  providerTimeoutMs,
  toolSchemas,
  buildSystemPrompt,
  buildUserMessage,
  onPrepared
}) {
  // Both are tracked outside the try block so the catch can report partial progress.
  let prepared = null;
  let invocation = null;

  try {
    prepared = await prepareProviderAttempt({
      plan,
      runtimeConfig: runtime.runtime,
      registry,
      tokenCounter,
      modelId,
      providerConfig,
      providerId,
      routingDecision,
      providerTimeoutMs,
      toolSchemas,
      buildSystemPrompt,
      buildUserMessage
    });

    if (typeof onPrepared === "function") {
      onPrepared(prepared);
    }

    invocation = await attachVisionInputs(
      plan,
      runtime.runtime,
      prepared.invocation,
      prepared.providerCapabilities
    );

    const { adapter, providerCapabilities, preflight } = prepared;

    if (mode === "dry-run") {
      // Nothing is sent to the provider, so usage is all zeros.
      const emptyUsage = {
        tokensIn: 0,
        tokensOut: 0,
        cacheIn: 0,
        cacheCreation: 0,
      };
      return {
        response: null,
        providerId,
        modelId,
        usage: emptyUsage,
        cached: false,
        adapter,
        providerCapabilities,
        invocation,
        preflight,
        providerModePolicy: null,
        health: null,
        toolLoopEnabled: false
      };
    }

    const providerModePolicy = assertProviderExecutionAllowed({
      jobId: plan.job.id,
      modelLane: routingDecision.selectedLane,
      providerId,
      interactive: plan.job.trigger === "interactive"
    });

    let health = null;
    if (providerModePolicy.requireHealthyProvider) {
      const probe = await adapter.healthCheck();
      if (!probe.ok) {
        throw new Error(`Provider health check failed for ${providerId} with status ${probe.status}`);
      }
      health = probe;
    }

    const response = await adapter.invoke(invocation);
    const usage = extractUsageMetrics(response);
    const cached = Boolean(usage.cacheIn || usage.cacheCreation);

    return {
      response,
      providerId,
      modelId,
      usage,
      cached,
      adapter,
      providerCapabilities,
      invocation,
      preflight,
      providerModePolicy,
      health,
      toolLoopEnabled: true
    };
  } catch (error) {
    const attemptContext = {
      providerId,
      modelId,
      routingDecision,
      providerCapabilities: prepared?.providerCapabilities || null,
      invocation: invocation || prepared?.invocation || null,
      preflight: prepared?.preflight || null
    };
    throw annotateAttemptError(error, attemptContext);
  }
}
381
+
382
/**
 * Creates the initial fallback-tracking record for an attempt: nothing allowed
 * or attempted yet, with the source lane/provider/model recorded and the
 * fallback policy looked up via `getReportFallbackPolicy`.
 *
 * @param {object} runtimeConfig - Passed to `getReportFallbackPolicy`.
 * @param {object} routingDecision - Its `selectedLane` seeds both lane fields.
 * @param {string} providerId - Recorded as `sourceProviderId`.
 * @param {string} modelId - Recorded as `sourceModelId`.
 * @param {object} options - Passed to `getReportFallbackPolicy`.
 * @returns {object} The initial fallback state.
 */
function buildFallbackState(runtimeConfig, routingDecision, providerId, modelId, options) {
  const { selectedLane } = routingDecision;
  const policy = getReportFallbackPolicy(runtimeConfig, options);

  return {
    allowed: false,
    attempted: false,
    trigger: null,
    finalSourceLane: selectedLane,
    sourceLane: selectedLane,
    sourceProviderId: providerId,
    sourceModelId: modelId,
    policy
  };
}
394
+
395
/**
 * Runs a plan against its provider chain, then against a report-fallback lane
 * if the chain fails and the fallback policy allows it.
 *
 * Flow:
 *  1. Resolve the primary model (explicit override, packet override, or router)
 *     and append the selected lane's `fallbackModels`.
 *  2. Try each model in order. Models whose circuit breaker is open are
 *     skipped. A retryable failure moves on to the next model; any other
 *     failure stops the chain.
 *  3. If no model succeeded, classify the failure and ask
 *     `resolveReportFallback` whether a fallback lane may be used. If not, the
 *     last error is rethrown with routing/fallback details attached.
 *  4. Otherwise run one attempt on the fallback lane's primary model. If that
 *     also fails, a combined error is thrown whose `cause` is the fallback
 *     error.
 *
 * @param {object} params
 * @param {object} params.plan - The execution plan.
 * @param {object} params.runtime - Reads `router`, `providers` and `runtime`.
 * @param {object} [params.options] - Mode, overrides, registry, token counter,
 *   prompt builders, `getBreaker`, `toolSchemas`, `allowToolLoopOnFallback`.
 * @returns {Promise<object>} The attempt result plus `routingDecision` and `fallback`
 *   (and `primaryModelId` when the primary chain succeeded).
 * @throws {Error} The annotated chain error when fallback is not allowed, or a
 *   combined error when the fallback attempt fails too.
 */
export async function attemptProvider({ plan, runtime, options = {} }) {
  const mode = options.mode || "dry-run";
  const router = options.router || new ModelRouter(runtime.router);
  const routingDecision = buildRoutingDecision(plan, options);
  const laneConfig = runtime.router?.[routingDecision.selectedLane];
  const primaryModelId = options.modelOverride || plan.packet.modelOverride || router.resolve(routingDecision.selectedLane, routingDecision.routeMode);
  const providersToTry = [primaryModelId, ...(laneConfig?.fallbackModels || [])];
  const toolSchemas = options.toolSchemas || [];
  const registry = options.registry;
  const tokenCounter = options.tokenCounter;
  const buildSystemPrompt = options.buildSystemPrompt;
  const buildUserMessage = options.buildUserMessage;

  let fallback = null;
  let primaryError = null;
  let lastProviderId = null;

  for (const currentModelId of providersToTry) {
    const currentProviderId = modelToProviderId(currentModelId);
    const providerConfig = runtime.providers[currentProviderId];
    const providerTimeoutMs = computeProviderTimeoutMs(plan, providerConfig, options);
    const breaker = options.getBreaker?.(currentModelId, runtime.runtime) || null;
    lastProviderId = currentProviderId;

    if (breaker?.isOpen()) {
      const retryAfter = breaker.retryAfter();
      console.warn(`[Nemoris] circuit breaker open for ${currentModelId}, skipping (retry in ${Math.ceil(retryAfter)}s)`);
      primaryError = new Error(`Provider ${currentModelId} circuit open — retry after ${Math.ceil(retryAfter)}s`);
      annotateAttemptError(primaryError, {
        providerId: currentProviderId,
        modelId: currentModelId,
        routingDecision,
        fallback
      });
      continue;
    }

    try {
      const attempt = await executeProviderCall({
        plan,
        runtime,
        mode,
        registry,
        tokenCounter,
        modelId: currentModelId,
        providerId: currentProviderId,
        providerConfig,
        routingDecision,
        providerTimeoutMs,
        toolSchemas,
        buildSystemPrompt,
        buildUserMessage,
        // The fallback state is seeded once, from the first model that gets as far as preparation.
        onPrepared: () => {
          if (!fallback) {
            fallback = buildFallbackState(runtime.runtime, routingDecision, currentProviderId, currentModelId, options);
          }
        }
      });

      // Dry runs never reach the provider, so they do not count as breaker successes.
      if (mode === "provider") {
        breaker?.recordSuccess();
      }

      return {
        ...attempt,
        routingDecision,
        fallback,
        primaryModelId
      };
    } catch (err) {
      primaryError = annotateAttemptError(err, {
        providerId: currentProviderId,
        modelId: currentModelId,
        routingDecision,
        fallback
      });
      const statusCode = err.statusCode || err.status || 0;
      breaker?.recordFailure(statusCode);

      if (isRetryableError(err)) {
        console.warn(`[executor] provider ${currentModelId} failed: ${err.message}, trying next`);
        continue;
      }
      // Non-retryable failures end the chain immediately.
      break;
    }
  }

  if (!primaryError) {
    primaryError = new Error("All providers in failover chain exhausted");
    annotateAttemptError(primaryError, {
      routingDecision,
      fallback
    });
  }

  const failureClass = classifyRuntimeFailure(primaryError?.message || "");
  const fallbackResolution = resolveReportFallback({
    runtimeConfig: runtime.runtime,
    job: plan.job,
    routingDecision,
    providerId: lastProviderId,
    failureClass,
    options
  });

  fallback = {
    ...(fallback || {}),
    allowed: fallbackResolution.allowed,
    attempted: false,
    trigger: failureClass,
    localFailureClass: failureClass,
    localError: primaryError.message,
    blockedReason: fallbackResolution.allowed ? null : fallbackResolution.reason,
    targetLane: fallbackResolution.targetLane || null
  };

  if (!fallbackResolution.allowed) {
    annotateAttemptError(primaryError, {
      providerId: primaryError.providerId || lastProviderId,
      routingDecision,
      fallback
    });
    throw primaryError;
  }

  fallback.attempted = true;
  const fallbackRoutingDecision = {
    ...routingDecision,
    selectedLane: fallbackResolution.targetLane,
    routeMode: "fallback",
    reasons: [...(routingDecision.reasons || []), `fallback:${failureClass}`],
    description: "Failure-triggered report fallback."
  };
  const fallbackModelId = router.resolve(fallbackResolution.targetLane, "primary");
  const fallbackProviderId = modelToProviderId(fallbackModelId);
  const fallbackProviderConfig = runtime.providers[fallbackProviderId];

  try {
    const attempt = await executeProviderCall({
      plan,
      runtime,
      mode,
      registry,
      tokenCounter,
      modelId: fallbackModelId,
      providerId: fallbackProviderId,
      providerConfig: fallbackProviderConfig,
      routingDecision: fallbackRoutingDecision,
      providerTimeoutMs: computeProviderTimeoutMs(plan, fallbackProviderConfig, options),
      toolSchemas,
      buildSystemPrompt,
      buildUserMessage
    });

    return {
      ...attempt,
      routingDecision: fallbackRoutingDecision,
      fallback: {
        ...fallback,
        success: true,
        finalSourceLane: fallbackRoutingDecision.selectedLane,
        finalProviderId: fallbackProviderId,
        finalModelId: fallbackModelId
      },
      // The tool loop on the fallback lane is opt-in and only for real provider runs.
      toolLoopEnabled: mode === "provider" && Boolean(options.allowToolLoopOnFallback)
    };
  } catch (fallbackError) {
    // Read the message defensively: a non-Error throw must not crash the handler.
    const fallbackMessage = fallbackError?.message ?? String(fallbackError);
    fallback = {
      ...fallback,
      success: false,
      fallbackFailureClass: classifyRuntimeFailure(fallbackError?.message || ""),
      fallbackError: fallbackMessage
    };
    // Keep the fallback error (and its stack) reachable through `cause`.
    const combinedError = new Error(
      `Primary provider failed (${failureClass}) and fallback failed: ${fallbackMessage}`,
      { cause: fallbackError }
    );
    annotateAttemptError(combinedError, {
      providerId: fallbackProviderId,
      modelId: fallbackModelId,
      routingDecision: fallbackRoutingDecision,
      providerCapabilities: fallbackError?.providerCapabilities || null,
      invocation: fallbackError?.invocation || null,
      preflight: fallbackError?.preflight || null,
      fallback
    });
    throw combinedError;
  }
}