nemoris 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (223) hide show
  1. package/.env.example +49 -0
  2. package/LICENSE +21 -0
  3. package/README.md +209 -0
  4. package/SECURITY.md +119 -0
  5. package/bin/nemoris +46 -0
  6. package/config/agents/agent.toml.example +28 -0
  7. package/config/agents/default.toml +22 -0
  8. package/config/agents/orchestrator.toml +18 -0
  9. package/config/delivery.toml +73 -0
  10. package/config/embeddings.toml +5 -0
  11. package/config/identity/default-purpose.md +1 -0
  12. package/config/identity/default-soul.md +3 -0
  13. package/config/identity/orchestrator-purpose.md +1 -0
  14. package/config/identity/orchestrator-soul.md +1 -0
  15. package/config/improvement-targets.toml +15 -0
  16. package/config/jobs/heartbeat-check.toml +30 -0
  17. package/config/jobs/memory-rollup.toml +46 -0
  18. package/config/jobs/workspace-health.toml +63 -0
  19. package/config/mcp.toml +16 -0
  20. package/config/output-contracts.toml +17 -0
  21. package/config/peers.toml +32 -0
  22. package/config/peers.toml.example +32 -0
  23. package/config/policies/memory-default.toml +10 -0
  24. package/config/policies/memory-heartbeat.toml +5 -0
  25. package/config/policies/memory-ops.toml +10 -0
  26. package/config/policies/tools-heartbeat-minimal.toml +8 -0
  27. package/config/policies/tools-interactive-safe.toml +8 -0
  28. package/config/policies/tools-ops-bounded.toml +8 -0
  29. package/config/policies/tools-orchestrator.toml +7 -0
  30. package/config/providers/anthropic.toml +15 -0
  31. package/config/providers/ollama.toml +5 -0
  32. package/config/providers/openai-codex.toml +9 -0
  33. package/config/providers/openrouter.toml +5 -0
  34. package/config/router.toml +22 -0
  35. package/config/runtime.toml +114 -0
  36. package/config/skills/self-improvement.toml +15 -0
  37. package/config/skills/telegram-onboarding-spec.md +240 -0
  38. package/config/skills/workspace-monitor.toml +15 -0
  39. package/config/task-router.toml +42 -0
  40. package/install.sh +50 -0
  41. package/package.json +90 -0
  42. package/src/auth/auth-profiles.js +169 -0
  43. package/src/auth/openai-codex-oauth.js +285 -0
  44. package/src/battle.js +449 -0
  45. package/src/cli/help.js +265 -0
  46. package/src/cli/output-filter.js +49 -0
  47. package/src/cli/runtime-control.js +704 -0
  48. package/src/cli-main.js +2763 -0
  49. package/src/cli.js +78 -0
  50. package/src/config/loader.js +332 -0
  51. package/src/config/schema-validator.js +214 -0
  52. package/src/config/toml-lite.js +8 -0
  53. package/src/daemon/action-handlers.js +71 -0
  54. package/src/daemon/healing-tick.js +87 -0
  55. package/src/daemon/health-probes.js +90 -0
  56. package/src/daemon/notifier.js +57 -0
  57. package/src/daemon/nurse.js +218 -0
  58. package/src/daemon/repair-log.js +106 -0
  59. package/src/daemon/rule-staging.js +90 -0
  60. package/src/daemon/rules.js +29 -0
  61. package/src/daemon/telegram-commands.js +54 -0
  62. package/src/daemon/updater.js +85 -0
  63. package/src/jobs/job-runner.js +78 -0
  64. package/src/mcp/consumer.js +129 -0
  65. package/src/memory/active-recall.js +171 -0
  66. package/src/memory/backend-manager.js +97 -0
  67. package/src/memory/backends/file-backend.js +38 -0
  68. package/src/memory/backends/qmd-backend.js +219 -0
  69. package/src/memory/embedding-guards.js +24 -0
  70. package/src/memory/embedding-index.js +118 -0
  71. package/src/memory/embedding-service.js +179 -0
  72. package/src/memory/file-index.js +177 -0
  73. package/src/memory/memory-signature.js +5 -0
  74. package/src/memory/memory-store.js +648 -0
  75. package/src/memory/retrieval-planner.js +66 -0
  76. package/src/memory/scoring.js +145 -0
  77. package/src/memory/simhash.js +78 -0
  78. package/src/memory/sqlite-active-store.js +824 -0
  79. package/src/memory/write-policy.js +36 -0
  80. package/src/onboarding/aliases.js +33 -0
  81. package/src/onboarding/auth/api-key.js +224 -0
  82. package/src/onboarding/auth/ollama-detect.js +42 -0
  83. package/src/onboarding/clack-prompter.js +77 -0
  84. package/src/onboarding/doctor.js +530 -0
  85. package/src/onboarding/lock.js +42 -0
  86. package/src/onboarding/model-catalog.js +344 -0
  87. package/src/onboarding/phases/auth.js +589 -0
  88. package/src/onboarding/phases/build.js +130 -0
  89. package/src/onboarding/phases/choose.js +82 -0
  90. package/src/onboarding/phases/detect.js +98 -0
  91. package/src/onboarding/phases/hatch.js +216 -0
  92. package/src/onboarding/phases/identity.js +79 -0
  93. package/src/onboarding/phases/ollama.js +345 -0
  94. package/src/onboarding/phases/scaffold.js +99 -0
  95. package/src/onboarding/phases/telegram.js +377 -0
  96. package/src/onboarding/phases/validate.js +204 -0
  97. package/src/onboarding/phases/verify.js +206 -0
  98. package/src/onboarding/platform.js +482 -0
  99. package/src/onboarding/status-bar.js +95 -0
  100. package/src/onboarding/templates.js +794 -0
  101. package/src/onboarding/toml-writer.js +38 -0
  102. package/src/onboarding/tui.js +250 -0
  103. package/src/onboarding/uninstall.js +153 -0
  104. package/src/onboarding/wizard.js +499 -0
  105. package/src/providers/anthropic.js +168 -0
  106. package/src/providers/base.js +247 -0
  107. package/src/providers/circuit-breaker.js +136 -0
  108. package/src/providers/ollama.js +163 -0
  109. package/src/providers/openai-codex.js +149 -0
  110. package/src/providers/openrouter.js +136 -0
  111. package/src/providers/registry.js +36 -0
  112. package/src/providers/router.js +16 -0
  113. package/src/runtime/bootstrap-cache.js +47 -0
  114. package/src/runtime/capabilities-prompt.js +25 -0
  115. package/src/runtime/completion-ping.js +99 -0
  116. package/src/runtime/config-validator.js +121 -0
  117. package/src/runtime/context-ledger.js +360 -0
  118. package/src/runtime/cutover-readiness.js +42 -0
  119. package/src/runtime/daemon.js +729 -0
  120. package/src/runtime/delivery-ack.js +195 -0
  121. package/src/runtime/delivery-adapters/local-file.js +41 -0
  122. package/src/runtime/delivery-adapters/openclaw-cli.js +94 -0
  123. package/src/runtime/delivery-adapters/openclaw-peer.js +98 -0
  124. package/src/runtime/delivery-adapters/shadow.js +13 -0
  125. package/src/runtime/delivery-adapters/standalone-http.js +98 -0
  126. package/src/runtime/delivery-adapters/telegram.js +104 -0
  127. package/src/runtime/delivery-adapters/tui.js +128 -0
  128. package/src/runtime/delivery-manager.js +807 -0
  129. package/src/runtime/delivery-store.js +168 -0
  130. package/src/runtime/dependency-health.js +118 -0
  131. package/src/runtime/envelope.js +114 -0
  132. package/src/runtime/evaluation.js +1089 -0
  133. package/src/runtime/exec-approvals.js +216 -0
  134. package/src/runtime/executor.js +500 -0
  135. package/src/runtime/failure-ping.js +67 -0
  136. package/src/runtime/flows.js +83 -0
  137. package/src/runtime/guards.js +45 -0
  138. package/src/runtime/handoff.js +51 -0
  139. package/src/runtime/identity-cache.js +28 -0
  140. package/src/runtime/improvement-engine.js +109 -0
  141. package/src/runtime/improvement-harness.js +581 -0
  142. package/src/runtime/input-sanitiser.js +72 -0
  143. package/src/runtime/interaction-contract.js +347 -0
  144. package/src/runtime/lane-readiness.js +226 -0
  145. package/src/runtime/migration.js +323 -0
  146. package/src/runtime/model-resolution.js +78 -0
  147. package/src/runtime/network.js +64 -0
  148. package/src/runtime/notification-store.js +97 -0
  149. package/src/runtime/notifier.js +256 -0
  150. package/src/runtime/orchestrator.js +53 -0
  151. package/src/runtime/orphan-reaper.js +41 -0
  152. package/src/runtime/output-contract-schema.js +139 -0
  153. package/src/runtime/output-contract-validator.js +439 -0
  154. package/src/runtime/peer-readiness.js +69 -0
  155. package/src/runtime/peer-registry.js +133 -0
  156. package/src/runtime/pilot-status.js +108 -0
  157. package/src/runtime/prompt-builder.js +261 -0
  158. package/src/runtime/provider-attempt.js +582 -0
  159. package/src/runtime/report-fallback.js +71 -0
  160. package/src/runtime/result-normalizer.js +183 -0
  161. package/src/runtime/retention.js +74 -0
  162. package/src/runtime/review.js +244 -0
  163. package/src/runtime/route-job.js +15 -0
  164. package/src/runtime/run-store.js +38 -0
  165. package/src/runtime/schedule.js +88 -0
  166. package/src/runtime/scheduler-state.js +434 -0
  167. package/src/runtime/scheduler.js +656 -0
  168. package/src/runtime/session-compactor.js +182 -0
  169. package/src/runtime/session-search.js +155 -0
  170. package/src/runtime/slack-inbound.js +249 -0
  171. package/src/runtime/ssrf.js +102 -0
  172. package/src/runtime/status-aggregator.js +330 -0
  173. package/src/runtime/task-contract.js +140 -0
  174. package/src/runtime/task-packet.js +107 -0
  175. package/src/runtime/task-router.js +140 -0
  176. package/src/runtime/telegram-inbound.js +1565 -0
  177. package/src/runtime/token-counter.js +134 -0
  178. package/src/runtime/token-estimator.js +59 -0
  179. package/src/runtime/tool-loop.js +200 -0
  180. package/src/runtime/transport-server.js +311 -0
  181. package/src/runtime/tui-server.js +411 -0
  182. package/src/runtime/ulid.js +44 -0
  183. package/src/security/ssrf-check.js +197 -0
  184. package/src/setup.js +369 -0
  185. package/src/shadow/bridge.js +303 -0
  186. package/src/skills/loader.js +84 -0
  187. package/src/tools/catalog.json +49 -0
  188. package/src/tools/cli-delegate.js +44 -0
  189. package/src/tools/mcp-client.js +106 -0
  190. package/src/tools/micro/cancel-task.js +6 -0
  191. package/src/tools/micro/complete-task.js +6 -0
  192. package/src/tools/micro/fail-task.js +6 -0
  193. package/src/tools/micro/http-fetch.js +74 -0
  194. package/src/tools/micro/index.js +36 -0
  195. package/src/tools/micro/lcm-recall.js +60 -0
  196. package/src/tools/micro/list-dir.js +17 -0
  197. package/src/tools/micro/list-skills.js +46 -0
  198. package/src/tools/micro/load-skill.js +38 -0
  199. package/src/tools/micro/memory-search.js +45 -0
  200. package/src/tools/micro/read-file.js +11 -0
  201. package/src/tools/micro/session-search.js +54 -0
  202. package/src/tools/micro/shell-exec.js +43 -0
  203. package/src/tools/micro/trigger-job.js +79 -0
  204. package/src/tools/micro/web-search.js +58 -0
  205. package/src/tools/micro/workspace-paths.js +39 -0
  206. package/src/tools/micro/write-file.js +14 -0
  207. package/src/tools/micro/write-memory.js +41 -0
  208. package/src/tools/registry.js +348 -0
  209. package/src/tools/tool-result-contract.js +36 -0
  210. package/src/tui/chat.js +835 -0
  211. package/src/tui/renderer.js +175 -0
  212. package/src/tui/socket-client.js +217 -0
  213. package/src/utils/canonical-json.js +29 -0
  214. package/src/utils/compaction.js +30 -0
  215. package/src/utils/env-loader.js +5 -0
  216. package/src/utils/errors.js +80 -0
  217. package/src/utils/fs.js +101 -0
  218. package/src/utils/ids.js +5 -0
  219. package/src/utils/model-context-limits.js +30 -0
  220. package/src/utils/token-budget.js +74 -0
  221. package/src/utils/usage-cost.js +25 -0
  222. package/src/utils/usage-metrics.js +14 -0
  223. package/vendor/smol-toml-1.5.2.tgz +0 -0
@@ -0,0 +1,582 @@
1
+ import { downloadTelegramFile } from "./telegram-inbound.js";
2
+ import { ModelRouter } from "../providers/router.js";
3
+ import { assertProviderExecutionAllowed } from "./guards.js";
4
+ import { compileOutputContractSchema } from "./output-contract-schema.js";
5
+ import { estimateInvocationTokens } from "./token-estimator.js";
6
+ import { TokenCounter } from "./token-counter.js";
7
+ import { classifyRuntimeFailure, getReportFallbackPolicy, resolveReportFallback } from "./report-fallback.js";
8
+ import { extractUsageMetrics } from "../utils/usage-metrics.js";
9
+
10
/**
 * Derives the provider identifier from a model identifier shaped like
 * `<provider>/<model>`.
 *
 * @param {*} modelId - Model identifier; falsy values are treated as "".
 * @returns {string|null} The text before the first "/", or null when that text is empty.
 */
export function modelToProviderId(modelId) {
  const [providerSegment] = String(modelId || "").split("/");
  return providerSegment || null;
}
13
+
14
/**
 * Decides whether a provider failure is transient enough to try the next
 * model in the failover chain.
 *
 * A failure is retryable when its message mentions a known network/timeout
 * marker, or when its HTTP status is 429 or any 5xx.
 *
 * Tolerates non-Error throwables: `null`/`undefined` are never retryable, a
 * thrown string is matched as the message, and string status codes such as
 * "503" are coerced to numbers before comparison.
 *
 * @param {*} err - The thrown value (usually an Error with optional `statusCode`/`status`).
 * @returns {boolean} True when the failure should be retried on another provider.
 */
export function isRetryableError(err) {
  const rawMessage = typeof err === "string" ? err : err?.message;
  const message = String(rawMessage ?? "").toLowerCase();
  // Number(...) lets "429"/"503" coming from loosely-typed HTTP clients match; NaN compares false.
  const statusCode = Number(err?.statusCode || err?.status || 0);

  const transientMarkers = [
    "econnrefused",
    "etimedout",
    "fetch failed",
    "net_error",
    "timeout",
    "enotfound",
    "eai_again"
  ];

  if (transientMarkers.some((marker) => message.includes(marker))) {
    return true;
  }

  return statusCode === 429 || (statusCode >= 500 && statusCode < 600);
}
36
+
37
/**
 * Resolves the timeout (in milliseconds) to apply to a provider call.
 *
 * An explicit `options.providerTimeoutMs` (anything other than null/undefined)
 * wins and is returned as a Number. Otherwise the result is the larger of the
 * provider's `defaultTimeoutMs` and a budget-derived timeout: the job's
 * `budget.maxRuntimeSeconds` plus five seconds, capped at 60000 ms.
 *
 * @param {object} plan - Execution plan; `plan.job.budget.maxRuntimeSeconds` is read when present.
 * @param {object} providerConfig - Provider configuration; `defaultTimeoutMs` is read when present.
 * @param {object} [options] - Call options; `providerTimeoutMs` overrides everything else.
 * @returns {number} Timeout in milliseconds (0 when nothing is configured).
 */
export function computeProviderTimeoutMs(plan, providerConfig, options = {}) {
  const { providerTimeoutMs } = options;
  if (providerTimeoutMs !== null && providerTimeoutMs !== undefined) {
    return Number(providerTimeoutMs);
  }

  const configuredMs = Number(providerConfig?.defaultTimeoutMs || 0);
  const runtimeBudgetSeconds = Number(plan?.job?.budget?.maxRuntimeSeconds || 0);

  let budgetMs = 0;
  if (runtimeBudgetSeconds) {
    // Five seconds of headroom over the job budget, never more than one minute.
    budgetMs = Math.min((runtimeBudgetSeconds + 5) * 1000, 60000);
  }

  return Math.max(configuredMs, budgetMs || 0);
}
47
+
48
/**
 * Builds the routing decision record for a plan.
 *
 * Explicit options take precedence over the plan's own routing data, which
 * in turn takes precedence over the defaults ("primary" route mode and the
 * job's requested model lane).
 *
 * @param {object} plan - Execution plan; `plan.job.modelLane` is required, `plan.routing` is optional.
 * @param {object} [options] - Optional `routeMode`, `laneOverride` and `modelOverride`.
 * @returns {{requestedLane: *, selectedLane: *, routeMode: *, matchedRule: *, reasons: Array, modelOverride: *}}
 */
export function buildRoutingDecision(plan, options = {}) {
  const planRouting = plan.routing;
  const requestedLane = plan.job.modelLane;

  return {
    requestedLane,
    selectedLane: options.laneOverride || planRouting?.selectedLane || requestedLane,
    routeMode: options.routeMode || planRouting?.routeMode || "primary",
    matchedRule: planRouting?.matchedRule || null,
    reasons: planRouting?.reasons || [],
    modelOverride: options.modelOverride || null
  };
}
60
+
61
/**
 * Returns the output-token cap for Ollama runs whose structured output is
 * enforced through a prompt contract, or null when no cap applies.
 *
 * The output-contract format is consulted first (bulleted_briefing: 1500,
 * structured_rollup: 2000); otherwise the selected lane decides
 * (local_cheap: 400, local_report: 1200).
 *
 * @param {object} plan - Execution plan; `plan.packet.layers.outputContract.format` is read when present.
 * @param {object} context
 * @param {string} context.providerId - Provider identifier; only "ollama" is capped.
 * @param {object} context.providerCapabilities - Capabilities; `structuredOutputMode` must be "prompt_contract".
 * @param {object} context.routingDecision - Routing decision; `selectedLane` is read.
 * @returns {number|null} The cap in tokens, or null.
 */
export function getLocalPromptContractOutputCap(plan, { providerId, providerCapabilities, routingDecision }) {
  const usesPromptContract = providerCapabilities?.structuredOutputMode === "prompt_contract";
  if (providerId !== "ollama" || !usesPromptContract) {
    return null;
  }

  const capsByFormat = new Map([
    ["bulleted_briefing", 1500],
    ["structured_rollup", 2000]
  ]);
  const capsByLane = new Map([
    ["local_cheap", 400],
    ["local_report", 1200]
  ]);

  const contractFormat = plan?.packet?.layers?.outputContract?.format || null;
  return capsByFormat.get(contractFormat) ?? capsByLane.get(routingDecision?.selectedLane) ?? null;
}
73
+
74
/**
 * Builds everything needed to call a provider for one model: the adapter,
 * its capabilities, the invocation payload and the preflight token check.
 *
 * Fix over the previous revision: when the local prompt-contract output cap
 * applies but the job budget declares no positive `maxTokens`, the cap itself
 * is used. Previously `Math.min(0, cap)` produced `maxTokens: 0` and
 * `num_predict: 0` for Ollama.
 *
 * @param {object} args
 * @param {object} args.plan - Execution plan; reads `job.id`, `job.budget.maxTokens`,
 *   `packet.layers.outputContract` and `packet.thinkMode`.
 * @param {object} args.runtimeConfig - Runtime configuration forwarded to `buildPreflight`.
 * @param {object} args.registry - Provider registry; `create(providerConfig)` yields the adapter.
 * @param {object} [args.tokenCounter] - Token counter forwarded to `buildPreflight`.
 * @param {string} args.modelId - Model identifier placed on the invocation.
 * @param {object} args.providerConfig - Provider configuration; required.
 * @param {string} args.providerId - Provider identifier ("ollama", "anthropic", ...).
 * @param {object} args.routingDecision - Routing decision used for the local output cap.
 * @param {number} args.providerTimeoutMs - Timeout placed on the invocation.
 * @param {Array} [args.toolSchemas] - Tool schemas; attached only when non-empty.
 * @param {Function} args.buildSystemPrompt - `(plan, ctx) => system prompt`.
 * @param {Function} args.buildUserMessage - `(plan, ctx) => user message content`.
 * @returns {Promise<{adapter: object, providerCapabilities: object|null, invocation: object, preflight: object}>}
 * @throws {Error} When `providerConfig` is missing or preflight reports "hard" pressure.
 */
export async function prepareProviderAttempt({
  plan,
  runtimeConfig,
  registry,
  tokenCounter,
  modelId,
  providerConfig,
  providerId,
  routingDecision,
  providerTimeoutMs,
  toolSchemas,
  buildSystemPrompt,
  buildUserMessage
}) {
  if (!providerConfig) {
    throw new Error(`No provider config for model ${modelId}`);
  }
  const adapter = registry.create(providerConfig);
  const providerCapabilities = adapter?.getCapabilities?.() || null;

  // Native structured output needs both an output contract and adapter support.
  const nativeStructuredOutput = Boolean(
    adapter &&
      plan.packet.layers.outputContract &&
      typeof adapter.supportsNativeStructuredOutput === "function" &&
      adapter.supportsNativeStructuredOutput()
  );
  const responseSchema = nativeStructuredOutput
    ? compileOutputContractSchema(plan.packet.layers.outputContract, {
        thoughtFirst: providerCapabilities?.supportsReasoningSchema === true
      })
    : null;

  const localPromptContractCap = getLocalPromptContractOutputCap(plan, {
    providerId,
    providerCapabilities,
    routingDecision
  });

  let effectiveMaxTokens = plan.job.budget.maxTokens;
  if (localPromptContractCap) {
    const budgetMaxTokens = Number(plan.job.budget.maxTokens || 0) || 0;
    // Without a positive budget the cap is the limit; never collapse to zero tokens.
    effectiveMaxTokens =
      budgetMaxTokens > 0 ? Math.min(budgetMaxTokens, localPromptContractCap) : localPromptContractCap;
  }

  const invocation = {
    model: modelId,
    system: buildSystemPrompt(plan, {
      nativeStructuredOutput,
      responseSchema,
      toolSchemas
    }),
    messages: [
      {
        role: "user",
        content: buildUserMessage(plan, {
          nativeStructuredOutput,
          responseSchema
        })
      }
    ],
    maxTokens: effectiveMaxTokens,
    responseSchema,
    timeoutMs: providerTimeoutMs,
    tools: toolSchemas?.length ? toolSchemas : undefined,
    // Ollama takes its generation limit through `options.num_predict`.
    options:
      providerId === "ollama"
        ? {
            num_predict: effectiveMaxTokens
          }
        : undefined
  };

  // Extended thinking is opt-in: Anthropic only, and only when the env flag is "true".
  const thinkMode = plan?.packet?.thinkMode;
  if (
    thinkMode &&
    thinkMode !== "off" &&
    providerId === "anthropic" &&
    process.env.ANTHROPIC_THINKING_ENABLED === "true"
  ) {
    const THINK_BUDGETS = { low: 1000, medium: 8000, high: 16000 };
    const budget = THINK_BUDGETS[thinkMode] || 8000;
    invocation.betas = [...(invocation.betas || []), "interleaved-thinking-2025-05-14"];
    invocation.thinking = { type: "enabled", budget_tokens: budget };
  }

  const preflight = await buildPreflight(runtimeConfig, invocation, {
    providerId,
    adapter,
    tokenCounter
  });

  if (preflight.pressure === "hard") {
    throw new Error(
      `Preflight blocked ${plan.job.id}: estimated prompt tokens ${preflight.estimatedPromptTokens} exceed hard limit ${preflight.hardLimit}`
    );
  }

  return {
    adapter,
    providerCapabilities,
    invocation,
    preflight
  };
}
173
+
174
/**
 * Estimates the prompt size of an invocation and grades it against the
 * configured context-pressure thresholds.
 *
 * Safety settings come from `runtimeConfig.safety`, defaulting to a 32768
 * token context, a 0.72 soft ratio and a 0.9 hard ratio. Pressure is "hard"
 * at or above the hard limit, "high" at or above the soft limit, else "low".
 *
 * @param {object} runtimeConfig - Runtime configuration; only `safety` is read.
 * @param {object} invocation - Provider invocation to measure.
 * @param {object} [options] - `tokenCounter` (defaults to a new TokenCounter), `providerId`, `adapter`.
 * @returns {Promise<object>} Limits, the token estimates, the pressure grade and the
 *   `freshSessionRequired` / `snapshotBeforeCompaction` flags.
 */
export async function buildPreflight(runtimeConfig, invocation, options = {}) {
  const safety = runtimeConfig?.safety;
  const contextTokens = safety?.contextTokens ?? 32768;
  const softRatio = safety?.contextPressureSoftRatio ?? 0.72;
  const hardRatio = safety?.contextPressureHardRatio ?? 0.9;
  const freshSessionOnHighPressure = safety?.freshSessionOnHighPressure ?? true;
  const snapshotBeforeCompaction = safety?.snapshotBeforeCompaction ?? true;

  const counter = options.tokenCounter || new TokenCounter();
  const tokenEstimate = await counter.countInvocation({
    providerId: options.providerId,
    invocation,
    adapter: options.adapter
  });

  // Reuse the counter's details when it already ran heuristically; otherwise compute them.
  let heuristicEstimate;
  if (tokenEstimate.mode === "heuristic") {
    heuristicEstimate = tokenEstimate.details;
  } else {
    heuristicEstimate = estimateInvocationTokens(invocation);
  }

  const estimatedPromptTokens = tokenEstimate.total;
  const softLimit = Math.floor(contextTokens * softRatio);
  const hardLimit = Math.floor(contextTokens * hardRatio);

  const gradePressure = () => {
    if (estimatedPromptTokens >= hardLimit) return "hard";
    if (estimatedPromptTokens >= softLimit) return "high";
    return "low";
  };
  const pressure = gradePressure();

  return {
    contextTokens,
    estimatedPromptTokens,
    tokenEstimate,
    heuristicEstimate,
    softLimit,
    hardLimit,
    pressure,
    freshSessionRequired: pressure !== "low" && freshSessionOnHighPressure,
    snapshotBeforeCompaction
  };
}
207
+
208
/**
 * Adds the plan's image references to the last user message of an invocation.
 *
 * - No image refs (or no invocation): the invocation is returned untouched.
 * - Provider without vision support: a plain-text note is appended to the
 *   last user message.
 * - Provider with vision support: each ref is downloaded through
 *   `downloadTelegramFile` using the bot token named by
 *   `runtimeConfig.telegram.botTokenEnv`; successful downloads become base64
 *   image blocks placed before the original text. A missing token only logs a
 *   warning.
 *
 * The invocation is mutated in place and also returned.
 *
 * @param {object} plan - Execution plan; `plan.packet.imageRefs` is read.
 * @param {object} runtimeConfig - Runtime configuration; `telegram.botTokenEnv` is read.
 * @param {object} invocation - Provider invocation whose `messages` may be rewritten.
 * @param {object} providerCapabilities - Capabilities; `supportsVision` selects the branch.
 * @returns {Promise<object>} The same invocation object.
 */
async function attachVisionInputs(plan, runtimeConfig, invocation, providerCapabilities) {
  const hasImageRefs = Boolean(plan.packet?.imageRefs?.length);
  if (!hasImageRefs || !invocation) {
    return invocation;
  }

  const isUserMessage = (message) => message.role === "user";

  if (!providerCapabilities?.supportsVision) {
    const note = "[Image received but this model doesn't support vision]";
    const lastUserIndex = invocation.messages.findLastIndex(isUserMessage);
    if (lastUserIndex !== -1) {
      const target = invocation.messages[lastUserIndex];
      const previousContent = target.content;
      target.content = previousContent ? `${previousContent}\n\n${note}` : note;
    }
    return invocation;
  }

  const telegramSettings = runtimeConfig?.telegram;
  const tokenEnvKey = telegramSettings?.botTokenEnv;
  const botToken = tokenEnvKey ? process.env[tokenEnvKey] : null;
  if (!botToken) {
    console.warn(`[executor] imageRefs present but botToken not resolved from ${tokenEnvKey || "undefined env key"}`);
    return invocation;
  }

  // Downloads stay sequential so block order follows the order of the refs.
  const imageBlocks = [];
  for (const imageRef of plan.packet.imageRefs) {
    const file = await downloadTelegramFile(imageRef.fileId, botToken);
    if (!file) {
      continue;
    }
    imageBlocks.push({
      type: "image",
      source: {
        type: "base64",
        media_type: file.mediaType,
        data: file.base64
      }
    });
  }

  if (imageBlocks.length === 0) {
    return invocation;
  }

  const lastUserIndex = invocation.messages.findLastIndex(isUserMessage);
  if (lastUserIndex !== -1) {
    const originalText = invocation.messages[lastUserIndex].content;
    invocation.messages[lastUserIndex].content = [...imageBlocks, { type: "text", text: originalText }];
  }
  return invocation;
}
259
+
260
/**
 * Copies attempt metadata onto an error object so callers can inspect which
 * provider/model/routing produced it.
 *
 * Values that are not objects (null, strings, numbers, ...) are returned
 * unchanged because properties cannot be attached to them.
 *
 * @param {*} error - The thrown value to annotate (mutated in place when it is an object).
 * @param {object} [metadata] - Properties to assign onto the error.
 * @returns {*} The same `error` value that was passed in.
 */
function annotateAttemptError(error, metadata = {}) {
  const canCarryMetadata = Boolean(error) && typeof error === "object";
  return canCarryMetadata ? Object.assign(error, metadata) : error;
}
268
+
269
/**
 * Runs one provider attempt for a single model: prepares the invocation,
 * attaches vision inputs, and (outside dry-run mode) invokes the adapter.
 *
 * In "dry-run" mode nothing is sent to the provider; the prepared invocation
 * is returned with zeroed usage and `toolLoopEnabled: false`. Otherwise the
 * provider execution policy is asserted, an optional health check is run, the
 * adapter is invoked and usage metrics are extracted.
 *
 * Any failure is re-thrown after being annotated with the provider, model,
 * routing decision and whatever was prepared before the failure.
 *
 * @param {object} args - Attempt inputs; see `prepareProviderAttempt` for the shared fields.
 * @param {object} args.runtime - Runtime bundle; `runtime.runtime` is the runtime configuration.
 * @param {string} args.mode - "dry-run" skips the provider call.
 * @param {Function} [args.onPrepared] - Called with the prepared attempt before vision inputs are attached.
 * @returns {Promise<object>} Attempt result (response, usage, adapter, invocation, preflight, ...).
 * @throws {*} The original failure, annotated with attempt metadata.
 */
async function executeProviderCall({
  plan,
  runtime,
  mode,
  registry,
  tokenCounter,
  modelId,
  providerId,
  providerConfig,
  routingDecision,
  providerTimeoutMs,
  toolSchemas,
  buildSystemPrompt,
  buildUserMessage,
  onPrepared
}) {
  let prepared = null;
  let invocation = null;

  try {
    const preparationArgs = {
      plan,
      runtimeConfig: runtime.runtime,
      registry,
      tokenCounter,
      modelId,
      providerConfig,
      providerId,
      routingDecision,
      providerTimeoutMs,
      toolSchemas,
      buildSystemPrompt,
      buildUserMessage
    };
    prepared = await prepareProviderAttempt(preparationArgs);

    if (typeof onPrepared === "function") {
      onPrepared(prepared);
    }

    invocation = await attachVisionInputs(
      plan,
      runtime.runtime,
      prepared.invocation,
      prepared.providerCapabilities
    );

    if (mode === "dry-run") {
      const emptyUsage = { tokensIn: 0, tokensOut: 0, cacheIn: 0, cacheCreation: 0 };
      return {
        response: null,
        providerId,
        modelId,
        usage: emptyUsage,
        cached: false,
        adapter: prepared.adapter,
        providerCapabilities: prepared.providerCapabilities,
        invocation,
        preflight: prepared.preflight,
        providerModePolicy: null,
        health: null,
        toolLoopEnabled: false
      };
    }

    const providerModePolicy = assertProviderExecutionAllowed({
      jobId: plan.job.id,
      modelLane: routingDecision.selectedLane,
      providerId,
      interactive: plan.job.trigger === "interactive"
    });

    // The health probe runs only when the policy demands a healthy provider.
    let health = null;
    if (providerModePolicy.requireHealthyProvider) {
      const probe = await prepared.adapter.healthCheck();
      if (!probe.ok) {
        throw new Error(`Provider health check failed for ${providerId} with status ${probe.status}`);
      }
      health = probe;
    }

    const response = await prepared.adapter.invoke(invocation);
    const usage = extractUsageMetrics(response);
    const cached = Boolean(usage.cacheIn || usage.cacheCreation);

    return {
      response,
      providerId,
      modelId,
      usage,
      cached,
      adapter: prepared.adapter,
      providerCapabilities: prepared.providerCapabilities,
      invocation,
      preflight: prepared.preflight,
      providerModePolicy,
      health,
      toolLoopEnabled: true
    };
  } catch (failure) {
    // Prefer the vision-augmented invocation; fall back to the prepared one.
    const attemptedInvocation = invocation || prepared?.invocation || null;
    throw annotateAttemptError(failure, {
      providerId,
      modelId,
      routingDecision,
      providerCapabilities: prepared?.providerCapabilities || null,
      invocation: attemptedInvocation,
      preflight: prepared?.preflight || null
    });
  }
}
381
+
382
/**
 * Creates the initial report-fallback bookkeeping record for an attempt.
 * The record starts as "not allowed, not attempted" and remembers which
 * lane, provider and model the attempt started from.
 *
 * @param {object} runtimeConfig - Runtime configuration passed to `getReportFallbackPolicy`.
 * @param {object} routingDecision - Routing decision; `selectedLane` seeds both lane fields.
 * @param {string} providerId - Provider the attempt started with.
 * @param {string} modelId - Model the attempt started with.
 * @param {object} options - Call options passed to `getReportFallbackPolicy`.
 * @returns {object} The fallback state record.
 */
function buildFallbackState(runtimeConfig, routingDecision, providerId, modelId, options) {
  const { selectedLane } = routingDecision;
  const policy = getReportFallbackPolicy(runtimeConfig, options);

  return {
    allowed: false,
    attempted: false,
    trigger: null,
    finalSourceLane: selectedLane,
    sourceLane: selectedLane,
    sourceProviderId: providerId,
    sourceModelId: modelId,
    policy
  };
}
394
+
395
/**
 * Executes a plan against the provider failover chain and, when that fails,
 * against the report-fallback lane if policy allows it.
 *
 * Flow:
 *  1. Resolve the primary model (explicit override, packet override, or the
 *     router) and append the lane's `fallbackModels`.
 *  2. Try each model in order. Models whose circuit breaker is open are
 *     skipped. A retryable failure moves on to the next model; any other
 *     failure stops the chain.
 *  3. If nothing succeeded, classify the last failure and ask
 *     `resolveReportFallback` whether a report fallback may run. If not, the
 *     last failure is re-thrown with fallback details attached.
 *  4. Otherwise run the fallback lane once. If that fails too, a combined
 *     error is thrown; the fallback failure is preserved as its `cause` so the
 *     original stack is not lost.
 *
 * @param {object} args
 * @param {object} args.plan - Execution plan (`job`, `packet`, optional `routing`).
 * @param {object} args.runtime - Runtime bundle (`router`, `providers`, `runtime`).
 * @param {object} [args.options] - `mode` (default "dry-run"), `router`, `modelOverride`,
 *   `toolSchemas`, `registry`, `tokenCounter`, `buildSystemPrompt`, `buildUserMessage`,
 *   `getBreaker`, `allowToolLoopOnFallback`, plus options consumed by the helpers.
 * @returns {Promise<object>} The successful attempt, with `routingDecision` and `fallback` state.
 * @throws {Error} The annotated primary failure, or a combined error when the fallback also fails.
 */
export async function attemptProvider({ plan, runtime, options = {} }) {
  const mode = options.mode || "dry-run";
  const router = options.router || new ModelRouter(runtime.router);
  const routingDecision = buildRoutingDecision(plan, options);
  const laneConfig = runtime.router?.[routingDecision.selectedLane];
  const primaryModelId =
    options.modelOverride ||
    plan.packet.modelOverride ||
    router.resolve(routingDecision.selectedLane, routingDecision.routeMode);
  const providersToTry = [primaryModelId, ...(laneConfig?.fallbackModels || [])];
  const toolSchemas = options.toolSchemas || [];
  const registry = options.registry;
  const tokenCounter = options.tokenCounter;
  const buildSystemPrompt = options.buildSystemPrompt;
  const buildUserMessage = options.buildUserMessage;

  let fallback = null;
  let primaryError = null;
  let lastProviderId = null;

  for (const currentModelId of providersToTry) {
    const currentProviderId = modelToProviderId(currentModelId);
    const providerConfig = runtime.providers[currentProviderId];
    const providerTimeoutMs = computeProviderTimeoutMs(plan, providerConfig, options);
    const breaker = options.getBreaker?.(currentModelId, runtime.runtime) || null;
    lastProviderId = currentProviderId;

    // An open breaker counts as a failure for this model without calling it.
    if (breaker?.isOpen()) {
      const retryAfter = breaker.retryAfter();
      console.warn(`[Nemoris] circuit breaker open for ${currentModelId}, skipping (retry in ${Math.ceil(retryAfter)}s)`);
      primaryError = new Error(`Provider ${currentModelId} circuit open — retry after ${Math.ceil(retryAfter)}s`);
      annotateAttemptError(primaryError, {
        providerId: currentProviderId,
        modelId: currentModelId,
        routingDecision,
        fallback
      });
      continue;
    }

    try {
      const attempt = await executeProviderCall({
        plan,
        runtime,
        mode,
        registry,
        tokenCounter,
        modelId: currentModelId,
        providerId: currentProviderId,
        providerConfig,
        routingDecision,
        providerTimeoutMs,
        toolSchemas,
        buildSystemPrompt,
        buildUserMessage,
        // The fallback state is seeded from the first model that got as far as preparation.
        onPrepared: () => {
          if (!fallback) {
            fallback = buildFallbackState(runtime.runtime, routingDecision, currentProviderId, currentModelId, options);
          }
        }
      });

      if (mode === "provider") {
        breaker?.recordSuccess();
      }

      return {
        ...attempt,
        routingDecision,
        fallback,
        primaryModelId
      };
    } catch (err) {
      primaryError = annotateAttemptError(err, {
        providerId: currentProviderId,
        modelId: currentModelId,
        routingDecision,
        fallback
      });
      const statusCode = err.statusCode || err.status || 0;
      breaker?.recordFailure(statusCode);

      if (isRetryableError(err)) {
        console.warn(`[executor] provider ${currentModelId} failed: ${err.message}, trying next`);
        continue;
      }
      break;
    }
  }

  if (!primaryError) {
    primaryError = new Error("All providers in failover chain exhausted");
    annotateAttemptError(primaryError, {
      routingDecision,
      fallback
    });
  }

  const failureClass = classifyRuntimeFailure(primaryError?.message || "");
  const fallbackResolution = resolveReportFallback({
    runtimeConfig: runtime.runtime,
    job: plan.job,
    routingDecision,
    providerId: lastProviderId,
    failureClass,
    options
  });

  fallback = {
    ...(fallback || {}),
    allowed: fallbackResolution.allowed,
    attempted: false,
    trigger: failureClass,
    localFailureClass: failureClass,
    localError: primaryError.message,
    blockedReason: fallbackResolution.allowed ? null : fallbackResolution.reason,
    targetLane: fallbackResolution.targetLane || null
  };

  if (!fallbackResolution.allowed) {
    annotateAttemptError(primaryError, {
      providerId: primaryError.providerId || lastProviderId,
      routingDecision,
      fallback
    });
    throw primaryError;
  }

  fallback.attempted = true;
  const fallbackRoutingDecision = {
    ...routingDecision,
    selectedLane: fallbackResolution.targetLane,
    routeMode: "fallback",
    reasons: [...(routingDecision.reasons || []), `fallback:${failureClass}`],
    description: "Failure-triggered report fallback."
  };
  const fallbackModelId = router.resolve(fallbackResolution.targetLane, "primary");
  const fallbackProviderId = modelToProviderId(fallbackModelId);
  const fallbackProviderConfig = runtime.providers[fallbackProviderId];

  try {
    const attempt = await executeProviderCall({
      plan,
      runtime,
      mode,
      registry,
      tokenCounter,
      modelId: fallbackModelId,
      providerId: fallbackProviderId,
      providerConfig: fallbackProviderConfig,
      routingDecision: fallbackRoutingDecision,
      providerTimeoutMs: computeProviderTimeoutMs(plan, fallbackProviderConfig, options),
      toolSchemas,
      buildSystemPrompt,
      buildUserMessage
    });

    return {
      ...attempt,
      routingDecision: fallbackRoutingDecision,
      fallback: {
        ...fallback,
        success: true,
        finalSourceLane: fallbackRoutingDecision.selectedLane,
        finalProviderId: fallbackProviderId,
        finalModelId: fallbackModelId
      },
      // The tool loop on the fallback lane is opt-in and never runs in dry-run mode.
      toolLoopEnabled: mode === "provider" && Boolean(options.allowToolLoopOnFallback)
    };
  } catch (fallbackError) {
    fallback = {
      ...fallback,
      success: false,
      fallbackFailureClass: classifyRuntimeFailure(fallbackError?.message || ""),
      fallbackError: fallbackError.message
    };
    // Keep the fallback failure as `cause` so its stack trace survives the wrap.
    const combinedError = new Error(
      `Primary provider failed (${failureClass}) and fallback failed: ${fallbackError.message}`,
      { cause: fallbackError }
    );
    annotateAttemptError(combinedError, {
      providerId: fallbackProviderId,
      modelId: fallbackModelId,
      routingDecision: fallbackRoutingDecision,
      providerCapabilities: fallbackError?.providerCapabilities || null,
      invocation: fallbackError?.invocation || null,
      preflight: fallbackError?.preflight || null,
      fallback
    });
    throw combinedError;
  }
}
@@ -0,0 +1,71 @@
1
+ import { getProviderModePolicy } from "./guards.js";
2
+
3
/**
 * Reads a boolean feature flag from the process environment.
 *
 * @param {string} name - Environment variable name.
 * @returns {boolean} True only when the variable is exactly "1" or "true".
 */
function readFlag(name) {
  const enabledValues = ["1", "true"];
  return enabledValues.includes(process.env[name]);
}
7
+
8
/**
 * Maps a failure message onto a coarse failure class by case-insensitive
 * substring matching. Rules are evaluated in order and the first match wins.
 *
 * @param {*} message - Failure message; falsy values classify as "unknown_failure".
 * @returns {string} One of "timeout", "provider_loading", "auth_missing", "missing_model",
 *   "structured_output_failure", "provider_error" or "unknown_failure".
 */
export function classifyRuntimeFailure(message) {
  const text = String(message || "").toLowerCase();
  if (!text) {
    return "unknown_failure";
  }

  const mentions = (needle) => text.includes(needle);

  // Order matters: earlier rules take precedence over later ones.
  const rules = [
    ["timeout", () => mentions("timed out")],
    ["provider_loading", () => mentions("loading model") || mentions("server loading")],
    ["auth_missing", () => mentions("missing auth token") || mentions("missing api key")],
    ["missing_model", () => mentions("model") && mentions("not found")],
    ["structured_output_failure", () => mentions("structured") && mentions("output")],
    ["provider_error", () => mentions("provider error")]
  ];

  const matched = rules.find(([, applies]) => applies());
  return matched ? matched[0] : "unknown_failure";
}
19
+
20
/**
 * Resolves the effective report-fallback policy from three sources: the
 * runtime configuration (`reportFallback`), the NEMORIS_ALLOW_REPORT_FALLBACK
 * environment flag, and the per-call `options.allowReportFallback` override.
 * Any one of them being on enables the fallback.
 *
 * @param {object} [runtimeConfig] - Runtime configuration; only `reportFallback` is read.
 * @param {object} [options] - Call options; `allowReportFallback` forces the fallback on.
 * @returns {{enabled: boolean, configEnabled: boolean, envEnabled: *, overrideEnabled: boolean,
 *   lane: string, allowedJobIds: string[], allowedFailureClasses: string[]}}
 */
export function getReportFallbackPolicy(runtimeConfig = {}, options = {}) {
  const settings = runtimeConfig?.reportFallback || {};
  const envEnabled = readFlag("NEMORIS_ALLOW_REPORT_FALLBACK");
  const configEnabled = settings.enabled === true;
  const enabled = Boolean(options.allowReportFallback || envEnabled || configEnabled);

  return {
    enabled,
    configEnabled,
    envEnabled,
    overrideEnabled: Boolean(options.allowReportFallback),
    lane: settings.lane || "report_fallback_lowcost",
    allowedJobIds: settings.allowedJobIds || ["workspace-health"],
    allowedFailureClasses: settings.allowedFailureClasses || ["timeout", "provider_loading"]
  };
}
35
+
36
/**
 * Decides whether a failed run may be retried on the report-fallback lane.
 *
 * Checks run in order and the first failing one produces the denial reason:
 * the job opted in, the policy is enabled, the job id is allow-listed, the
 * failure class is allow-listed, the failure came from Ollama on the
 * "local_report" lane, and remote provider execution is permitted.
 *
 * @param {object} args
 * @param {object} args.runtimeConfig - Runtime configuration used to resolve the policy.
 * @param {object} args.job - Job definition; `reportFallback` and `id` are read.
 * @param {object} args.routingDecision - Routing decision; `selectedLane` is read.
 * @param {string} args.providerId - Provider that produced the failure.
 * @param {string} args.failureClass - Class from `classifyRuntimeFailure`.
 * @param {object} [args.options] - Call options forwarded to the policy resolver.
 * @returns {{allowed: false, policy: object, reason: string} |
 *   {allowed: true, policy: object, targetLane: string, trigger: string}}
 */
export function resolveReportFallback({ runtimeConfig, job, routingDecision, providerId, failureClass, options = {} }) {
  const policy = getReportFallbackPolicy(runtimeConfig, options);
  const jobPolicy = job?.reportFallback || null;
  const deny = (reason) => ({ allowed: false, policy, reason });

  if (!jobPolicy?.enabled) {
    return deny("Job is not configured for report fallback.");
  }
  if (!policy.enabled) {
    return deny("Report fallback is disabled.");
  }
  if (!policy.allowedJobIds.includes(job.id)) {
    return deny(`Job ${job.id} is not allowed to use report fallback.`);
  }
  if (!policy.allowedFailureClasses.includes(failureClass)) {
    return deny(`Failure class ${failureClass} does not qualify for report fallback.`);
  }

  const failedOnLocalReport = providerId === "ollama" && routingDecision?.selectedLane === "local_report";
  if (!failedOnLocalReport) {
    return deny("Report fallback only applies after local_report Ollama failures.");
  }

  // The provider-mode policy is consulted last, only once every cheaper check passed.
  const { allowRemoteProviders } = getProviderModePolicy();
  if (!allowRemoteProviders) {
    return deny("Remote provider execution is not enabled.");
  }

  return {
    allowed: true,
    policy,
    targetLane: jobPolicy.lane || policy.lane,
    trigger: failureClass
  };
}