npm - fixo-cli - Versions diffs - 1.0.0 - Mend

fixo-cli 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (303) hide show

package/LICENSE +201 -0
package/README.md +530 -0
package/dist/agent/agent-client.d.ts +108 -0
package/dist/agent/agent-client.d.ts.map +1 -0
package/dist/agent/agent-client.js +1247 -0
package/dist/agent/agent-client.js.map +1 -0
package/dist/agent/agent-pool.d.ts +20 -0
package/dist/agent/agent-pool.d.ts.map +1 -0
package/dist/agent/agent-pool.js +217 -0
package/dist/agent/agent-pool.js.map +1 -0
package/dist/agent/background-awareness.d.ts +55 -0
package/dist/agent/background-awareness.d.ts.map +1 -0
package/dist/agent/background-awareness.js +104 -0
package/dist/agent/background-awareness.js.map +1 -0
package/dist/agent/command-parser.d.ts +33 -0
package/dist/agent/command-parser.d.ts.map +1 -0
package/dist/agent/command-parser.js +120 -0
package/dist/agent/command-parser.js.map +1 -0
package/dist/agent/context-budget.d.ts +91 -0
package/dist/agent/context-budget.d.ts.map +1 -0
package/dist/agent/context-budget.js +219 -0
package/dist/agent/context-budget.js.map +1 -0
package/dist/agent/conversation.d.ts +190 -0
package/dist/agent/conversation.d.ts.map +1 -0
package/dist/agent/conversation.js +547 -0
package/dist/agent/conversation.js.map +1 -0
package/dist/agent/hooks.d.ts +72 -0
package/dist/agent/hooks.d.ts.map +1 -0
package/dist/agent/hooks.js +214 -0
package/dist/agent/hooks.js.map +1 -0
package/dist/agent/mcp-bridge.d.ts +13 -0
package/dist/agent/mcp-bridge.d.ts.map +1 -0
package/dist/agent/mcp-bridge.js +86 -0
package/dist/agent/mcp-bridge.js.map +1 -0
package/dist/agent/mcp-client.d.ts +24 -0
package/dist/agent/mcp-client.d.ts.map +1 -0
package/dist/agent/mcp-client.js +146 -0
package/dist/agent/mcp-client.js.map +1 -0
package/dist/agent/mcp-manager.d.ts +13 -0
package/dist/agent/mcp-manager.d.ts.map +1 -0
package/dist/agent/mcp-manager.js +84 -0
package/dist/agent/mcp-manager.js.map +1 -0
package/dist/agent/mcp-registry.d.ts +45 -0
package/dist/agent/mcp-registry.d.ts.map +1 -0
package/dist/agent/mcp-registry.js +98 -0
package/dist/agent/mcp-registry.js.map +1 -0
package/dist/agent/orchestrator.d.ts +14 -0
package/dist/agent/orchestrator.d.ts.map +1 -0
package/dist/agent/orchestrator.js +118 -0
package/dist/agent/orchestrator.js.map +1 -0
package/dist/agent/parser-adapter.d.ts +120 -0
package/dist/agent/parser-adapter.d.ts.map +1 -0
package/dist/agent/parser-adapter.js +265 -0
package/dist/agent/parser-adapter.js.map +1 -0
package/dist/agent/parsers/imports.d.ts +11 -0
package/dist/agent/parsers/imports.d.ts.map +1 -0
package/dist/agent/parsers/imports.js +94 -0
package/dist/agent/parsers/imports.js.map +1 -0
package/dist/agent/parsers/shell.d.ts +23 -0
package/dist/agent/parsers/shell.d.ts.map +1 -0
package/dist/agent/parsers/shell.js +200 -0
package/dist/agent/parsers/shell.js.map +1 -0
package/dist/agent/parsers/symbols.d.ts +17 -0
package/dist/agent/parsers/symbols.d.ts.map +1 -0
package/dist/agent/parsers/symbols.js +103 -0
package/dist/agent/parsers/symbols.js.map +1 -0
package/dist/agent/permissions.d.ts +65 -0
package/dist/agent/permissions.d.ts.map +1 -0
package/dist/agent/permissions.js +219 -0
package/dist/agent/permissions.js.map +1 -0
package/dist/agent/predictive-gate.d.ts +69 -0
package/dist/agent/predictive-gate.d.ts.map +1 -0
package/dist/agent/predictive-gate.js +128 -0
package/dist/agent/predictive-gate.js.map +1 -0
package/dist/agent/provider-cooldown.d.ts +144 -0
package/dist/agent/provider-cooldown.d.ts.map +1 -0
package/dist/agent/provider-cooldown.js +300 -0
package/dist/agent/provider-cooldown.js.map +1 -0
package/dist/agent/providers-manager.d.ts +109 -0
package/dist/agent/providers-manager.d.ts.map +1 -0
package/dist/agent/providers-manager.js +464 -0
package/dist/agent/providers-manager.js.map +1 -0
package/dist/agent/repo-map.d.ts +6 -0
package/dist/agent/repo-map.d.ts.map +1 -0
package/dist/agent/repo-map.js +221 -0
package/dist/agent/repo-map.js.map +1 -0
package/dist/agent/retry.d.ts +103 -0
package/dist/agent/retry.d.ts.map +1 -0
package/dist/agent/retry.js +276 -0
package/dist/agent/retry.js.map +1 -0
package/dist/agent/search/index.d.ts +61 -0
package/dist/agent/search/index.d.ts.map +1 -0
package/dist/agent/search/index.js +314 -0
package/dist/agent/search/index.js.map +1 -0
package/dist/agent/single-agent.d.ts +76 -0
package/dist/agent/single-agent.d.ts.map +1 -0
package/dist/agent/single-agent.js +697 -0
package/dist/agent/single-agent.js.map +1 -0
package/dist/agent/skills.d.ts +22 -0
package/dist/agent/skills.d.ts.map +1 -0
package/dist/agent/skills.js +139 -0
package/dist/agent/skills.js.map +1 -0
package/dist/agent/stream-glue.d.ts +85 -0
package/dist/agent/stream-glue.d.ts.map +1 -0
package/dist/agent/stream-glue.js +120 -0
package/dist/agent/stream-glue.js.map +1 -0
package/dist/agent/subagent.d.ts +72 -0
package/dist/agent/subagent.d.ts.map +1 -0
package/dist/agent/subagent.js +193 -0
package/dist/agent/subagent.js.map +1 -0
package/dist/agent/telemetry.d.ts +192 -0
package/dist/agent/telemetry.d.ts.map +1 -0
package/dist/agent/telemetry.js +400 -0
package/dist/agent/telemetry.js.map +1 -0
package/dist/agent/tokenizer.d.ts +42 -0
package/dist/agent/tokenizer.d.ts.map +1 -0
package/dist/agent/tokenizer.js +107 -0
package/dist/agent/tokenizer.js.map +1 -0
package/dist/agent/tool-executor.d.ts +289 -0
package/dist/agent/tool-executor.d.ts.map +1 -0
package/dist/agent/tool-executor.js +2519 -0
package/dist/agent/tool-executor.js.map +1 -0
package/dist/agent/web-impl.d.ts +2 -0
package/dist/agent/web-impl.d.ts.map +1 -0
package/dist/agent/web-impl.js +34 -0
package/dist/agent/web-impl.js.map +1 -0
package/dist/agent/web.d.ts +8 -0
package/dist/agent/web.d.ts.map +1 -0
package/dist/agent/web.js +8 -0
package/dist/agent/web.js.map +1 -0
package/dist/agent/worker-agent.d.ts +27 -0
package/dist/agent/worker-agent.d.ts.map +1 -0
package/dist/agent/worker-agent.js +503 -0
package/dist/agent/worker-agent.js.map +1 -0
package/dist/config.d.ts +162 -0
package/dist/config.d.ts.map +1 -0
package/dist/config.js +138 -0
package/dist/config.js.map +1 -0
package/dist/context/fixo-md-watcher.d.ts +42 -0
package/dist/context/fixo-md-watcher.d.ts.map +1 -0
package/dist/context/fixo-md-watcher.js +126 -0
package/dist/context/fixo-md-watcher.js.map +1 -0
package/dist/context/fixo-md.d.ts +50 -0
package/dist/context/fixo-md.d.ts.map +1 -0
package/dist/context/fixo-md.js +118 -0
package/dist/context/fixo-md.js.map +1 -0
package/dist/context/todo.d.ts +65 -0
package/dist/context/todo.d.ts.map +1 -0
package/dist/context/todo.js +194 -0
package/dist/context/todo.js.map +1 -0
package/dist/git/git-manager.d.ts +33 -0
package/dist/git/git-manager.d.ts.map +1 -0
package/dist/git/git-manager.js +293 -0
package/dist/git/git-manager.js.map +1 -0
package/dist/git/git-ops.d.ts +10 -0
package/dist/git/git-ops.d.ts.map +1 -0
package/dist/git/git-ops.js +131 -0
package/dist/git/git-ops.js.map +1 -0
package/dist/index.d.ts +3 -0
package/dist/index.d.ts.map +1 -0
package/dist/index.js +352 -0
package/dist/index.js.map +1 -0
package/dist/indexer.d.ts +30 -0
package/dist/indexer.d.ts.map +1 -0
package/dist/indexer.js +273 -0
package/dist/indexer.js.map +1 -0
package/dist/lsp/lsp-client.d.ts +24 -0
package/dist/lsp/lsp-client.d.ts.map +1 -0
package/dist/lsp/lsp-client.js +205 -0
package/dist/lsp/lsp-client.js.map +1 -0
package/dist/lsp/lsp-manager.d.ts +17 -0
package/dist/lsp/lsp-manager.d.ts.map +1 -0
package/dist/lsp/lsp-manager.js +154 -0
package/dist/lsp/lsp-manager.js.map +1 -0
package/dist/lsp/lsp-pre-save.d.ts +137 -0
package/dist/lsp/lsp-pre-save.d.ts.map +1 -0
package/dist/lsp/lsp-pre-save.js +245 -0
package/dist/lsp/lsp-pre-save.js.map +1 -0
package/dist/lsp/syntax-fallback.d.ts +83 -0
package/dist/lsp/syntax-fallback.d.ts.map +1 -0
package/dist/lsp/syntax-fallback.js +275 -0
package/dist/lsp/syntax-fallback.js.map +1 -0
package/dist/model-outcomes.d.ts +12 -0
package/dist/model-outcomes.d.ts.map +1 -0
package/dist/model-outcomes.js +46 -0
package/dist/model-outcomes.js.map +1 -0
package/dist/planner.d.ts +32 -0
package/dist/planner.d.ts.map +1 -0
package/dist/planner.js +163 -0
package/dist/planner.js.map +1 -0
package/dist/project-memory.d.ts +29 -0
package/dist/project-memory.d.ts.map +1 -0
package/dist/project-memory.js +349 -0
package/dist/project-memory.js.map +1 -0
package/dist/review.d.ts +2 -0
package/dist/review.d.ts.map +1 -0
package/dist/review.js +61 -0
package/dist/review.js.map +1 -0
package/dist/runtime/background-jobs.d.ts +97 -0
package/dist/runtime/background-jobs.d.ts.map +1 -0
package/dist/runtime/background-jobs.js +331 -0
package/dist/runtime/background-jobs.js.map +1 -0
package/dist/runtime/credential-vault.d.ts +124 -0
package/dist/runtime/credential-vault.d.ts.map +1 -0
package/dist/runtime/credential-vault.js +184 -0
package/dist/runtime/credential-vault.js.map +1 -0
package/dist/runtime/loop-trap.d.ts +197 -0
package/dist/runtime/loop-trap.d.ts.map +1 -0
package/dist/runtime/loop-trap.js +420 -0
package/dist/runtime/loop-trap.js.map +1 -0
package/dist/runtime/policy.d.ts +15 -0
package/dist/runtime/policy.d.ts.map +1 -0
package/dist/runtime/policy.js +60 -0
package/dist/runtime/policy.js.map +1 -0
package/dist/runtime/redaction.d.ts +66 -0
package/dist/runtime/redaction.d.ts.map +1 -0
package/dist/runtime/redaction.js +155 -0
package/dist/runtime/redaction.js.map +1 -0
package/dist/runtime/session-snapshots.d.ts +76 -0
package/dist/runtime/session-snapshots.d.ts.map +1 -0
package/dist/runtime/session-snapshots.js +166 -0
package/dist/runtime/session-snapshots.js.map +1 -0
package/dist/runtime/staging.d.ts +205 -0
package/dist/runtime/staging.d.ts.map +1 -0
package/dist/runtime/staging.js +526 -0
package/dist/runtime/staging.js.map +1 -0
package/dist/runtime/task-session.d.ts +95 -0
package/dist/runtime/task-session.d.ts.map +1 -0
package/dist/runtime/task-session.js +263 -0
package/dist/runtime/task-session.js.map +1 -0
package/dist/runtime/worktree.d.ts +55 -0
package/dist/runtime/worktree.d.ts.map +1 -0
package/dist/runtime/worktree.js +175 -0
package/dist/runtime/worktree.js.map +1 -0
package/dist/setup-wizard.d.ts +8 -0
package/dist/setup-wizard.d.ts.map +1 -0
package/dist/setup-wizard.js +73 -0
package/dist/setup-wizard.js.map +1 -0
package/dist/shared/content.d.ts +43 -0
package/dist/shared/content.d.ts.map +1 -0
package/dist/shared/content.js +61 -0
package/dist/shared/content.js.map +1 -0
package/dist/shared/types.d.ts +217 -0
package/dist/shared/types.d.ts.map +1 -0
package/dist/shared/types.js +3 -0
package/dist/shared/types.js.map +1 -0
package/dist/test-runner.d.ts +5 -0
package/dist/test-runner.d.ts.map +1 -0
package/dist/test-runner.js +42 -0
package/dist/test-runner.js.map +1 -0
package/dist/types.d.ts +85 -0
package/dist/types.d.ts.map +1 -0
package/dist/types.js +2 -0
package/dist/types.js.map +1 -0
package/dist/ui/ascii.d.ts +23 -0
package/dist/ui/ascii.d.ts.map +1 -0
package/dist/ui/ascii.js +45 -0
package/dist/ui/ascii.js.map +1 -0
package/dist/ui/colors.d.ts +111 -0
package/dist/ui/colors.d.ts.map +1 -0
package/dist/ui/colors.js +166 -0
package/dist/ui/colors.js.map +1 -0
package/dist/ui/image-attach.d.ts +27 -0
package/dist/ui/image-attach.d.ts.map +1 -0
package/dist/ui/image-attach.js +100 -0
package/dist/ui/image-attach.js.map +1 -0
package/dist/ui/index.d.ts +18 -0
package/dist/ui/index.d.ts.map +1 -0
package/dist/ui/index.js +18 -0
package/dist/ui/index.js.map +1 -0
package/dist/ui/markdown-stream.d.ts +91 -0
package/dist/ui/markdown-stream.d.ts.map +1 -0
package/dist/ui/markdown-stream.js +524 -0
package/dist/ui/markdown-stream.js.map +1 -0
package/dist/ui/plan-renderer.d.ts +36 -0
package/dist/ui/plan-renderer.d.ts.map +1 -0
package/dist/ui/plan-renderer.js +79 -0
package/dist/ui/plan-renderer.js.map +1 -0
package/dist/ui/prompt.d.ts +11 -0
package/dist/ui/prompt.d.ts.map +1 -0
package/dist/ui/prompt.js +1960 -0
package/dist/ui/prompt.js.map +1 -0
package/dist/ui/render-primitives.d.ts +117 -0
package/dist/ui/render-primitives.d.ts.map +1 -0
package/dist/ui/render-primitives.js +322 -0
package/dist/ui/render-primitives.js.map +1 -0
package/dist/ui/render.d.ts +133 -0
package/dist/ui/render.d.ts.map +1 -0
package/dist/ui/render.js +547 -0
package/dist/ui/render.js.map +1 -0
package/dist/ui/session-header.d.ts +30 -0
package/dist/ui/session-header.d.ts.map +1 -0
package/dist/ui/session-header.js +74 -0
package/dist/ui/session-header.js.map +1 -0
package/dist/workspace-guard.d.ts +68 -0
package/dist/workspace-guard.d.ts.map +1 -0
package/dist/workspace-guard.js +168 -0
package/dist/workspace-guard.js.map +1 -0
package/dist/workspace-lock.d.ts +27 -0
package/dist/workspace-lock.d.ts.map +1 -0
package/dist/workspace-lock.js +95 -0
package/dist/workspace-lock.js.map +1 -0
package/package.json +63 -0

package/dist/agent/agent-client.js ADDED Viewed

@@ -0,0 +1,1247 @@
+import { colors } from '../ui/colors.js';
+import { ProvidersManager } from './providers-manager.js';
+import { providerCooldown } from './provider-cooldown.js';
+import { reconstructPartialResponse, isMidStreamResumable, StreamResumeExhaustedError, } from './stream-glue.js';
+import { DEFAULT_API_URL } from '../config.js';
+import { recordTelemetry, telemetry } from './telemetry.js';
+import { getProviderKeyVault } from '../runtime/credential-vault.js';
+import { extractTextFromContent } from '../shared/content.js';
+/* ──────────────────────── Constants ──────────────────────── */
+// Highest retry index used by `chat()`: its loop runs `attempt` from 0 through
+// MAX_RETRIES inclusive, so one call may issue up to MAX_RETRIES + 1 requests.
+const MAX_RETRIES = 5;
+// Base of the exponential backoff: the wait before the next attempt is
+// BASE_DELAY_MS * 2^attempt milliseconds.
+const BASE_DELAY_MS = 1500;
+// HTTP statuses that are treated as transient and retried instead of being
+// surfaced to the caller immediately.
+const RETRYABLE_STATUS_CODES = new Set([408, 429, 500, 502, 503]);
+// Default API endpoint; the FIXO_API_URL environment variable takes precedence
+// over the DEFAULT_API_URL imported from the config module.
+const BASE_URL = process.env.FIXO_API_URL || DEFAULT_API_URL;
+/** Wrapper around `providerCooldown.recordFailure` that also emits a
+ *  telemetry event. Keeps the 6 callsites terse. */
+function trackProviderError(providerId, status, message) {
+    const cooldownMs = providerCooldown.recordFailure(providerId, status, message);
+    if (cooldownMs > 0) {
+        recordTelemetry(telemetry.cooldown({
+            providerId,
+            status,
+            cooldownMs,
+            reason: message.slice(0, 200),
+        }));
+    }
+    else if (status >= 400) {
+        recordTelemetry(telemetry.providerError({ providerId, status, message: message.slice(0, 200) }));
+    }
+    return cooldownMs;
+}
+/* ──────────────────────── ThinkTagParser ──────────────────────── */
+export var ContentType;
+(function (ContentType) {
+    ContentType["TEXT"] = "text";
+    ContentType["THINKING"] = "thinking";
+})(ContentType || (ContentType = {}));
+export class ThinkTagParser {
+    OPEN_TAG = '<think>';
+    CLOSE_TAG = '</think>';
+    _buffer = '';
+    _in_think_tag = false;
+    get in_think_mode() {
+        return this._in_think_tag;
+    }
+    *feed(content) {
+        this._buffer += content;
+        while (this._buffer) {
+            const prev_len = this._buffer.length;
+            let chunk = null;
+            if (!this._in_think_tag) {
+                chunk = this._parse_outside_think();
+            }
+            else {
+                chunk = this._parse_inside_think();
+            }
+            if (chunk) {
+                yield chunk;
+            }
+            else if (this._buffer.length === prev_len) {
+                break;
+            }
+        }
+    }
+    _parse_outside_think() {
+        const think_start = this._buffer.indexOf(this.OPEN_TAG);
+        const orphan_close = this._buffer.indexOf(this.CLOSE_TAG);
+        if (orphan_close !== -1 && (think_start === -1 || orphan_close < think_start)) {
+            const pre_orphan = this._buffer.slice(0, orphan_close);
+            this._buffer = this._buffer.slice(orphan_close + this.CLOSE_TAG.length);
+            if (pre_orphan) {
+                return { type: ContentType.TEXT, content: pre_orphan };
+            }
+            return null;
+        }
+        if (think_start === -1) {
+            const last_bracket = this._buffer.lastIndexOf('<');
+            if (last_bracket !== -1) {
+                const potential_tag = this._buffer.slice(last_bracket);
+                const tag_len = potential_tag.length;
+                if ((tag_len < this.OPEN_TAG.length && this.OPEN_TAG.startsWith(potential_tag)) ||
+                    (tag_len < this.CLOSE_TAG.length && this.CLOSE_TAG.startsWith(potential_tag))) {
+                    const emit = this._buffer.slice(0, last_bracket);
+                    this._buffer = this._buffer.slice(last_bracket);
+                    if (emit) {
+                        return { type: ContentType.TEXT, content: emit };
+                    }
+                    return null;
+                }
+            }
+            const emit = this._buffer;
+            this._buffer = '';
+            if (emit) {
+                return { type: ContentType.TEXT, content: emit };
+            }
+            return null;
+        }
+        const pre_think = this._buffer.slice(0, think_start);
+        this._buffer = this._buffer.slice(think_start + this.OPEN_TAG.length);
+        this._in_think_tag = true;
+        if (pre_think) {
+            return { type: ContentType.TEXT, content: pre_think };
+        }
+        return null;
+    }
+    _parse_inside_think() {
+        const think_end = this._buffer.indexOf(this.CLOSE_TAG);
+        if (think_end === -1) {
+            const last_bracket = this._buffer.lastIndexOf('<');
+            if (last_bracket !== -1 && this._buffer.length - last_bracket < this.CLOSE_TAG.length) {
+                const potential_tag = this._buffer.slice(last_bracket);
+                if (this.CLOSE_TAG.startsWith(potential_tag)) {
+                    const emit = this._buffer.slice(0, last_bracket);
+                    this._buffer = this._buffer.slice(last_bracket);
+                    if (emit) {
+                        return { type: ContentType.THINKING, content: emit };
+                    }
+                    return null;
+                }
+            }
+            const emit = this._buffer;
+            this._buffer = '';
+            if (emit) {
+                return { type: ContentType.THINKING, content: emit };
+            }
+            return null;
+        }
+        const thinking_content = this._buffer.slice(0, think_end);
+        this._buffer = this._buffer.slice(think_end + this.CLOSE_TAG.length);
+        this._in_think_tag = false;
+        if (thinking_content) {
+            return { type: ContentType.THINKING, content: thinking_content };
+        }
+        return null;
+    }
+    flush() {
+        if (this._buffer) {
+            const chunk_type = this._in_think_tag ? ContentType.THINKING : ContentType.TEXT;
+            const content = this._buffer;
+            this._buffer = '';
+            return { type: chunk_type, content };
+        }
+        return null;
+    }
+}
+/* ──────────────────────── HttpError ──────────────────────── */
+/**
+ * Error that carries the HTTP status code of a failed response, so callers
+ * can branch on `error.status` instead of parsing the message.
+ */
+export class HttpError extends Error {
+    status;
+    /**
+     * @param status  HTTP status code of the failed response.
+     * @param message Human-readable description.
+     */
+    constructor(status, message) {
+        super(message);
+        Object.assign(this, { status, name: 'HttpError' });
+    }
+}
+/* ──────────────────────── AgentClient ──────────────────────── */
+export class AgentClient {
+    baseUrl;
+    apiKey;
+    verbose;
+    constructor(apiKey, apiUrl, verbose = false) {
+        this.baseUrl = process.env.FIXO_API_URL || apiUrl || BASE_URL;
+        this.apiKey = apiKey;
+        this.verbose = verbose;
+    }
+    resolveDirectConfig(model) {
+        const modelLower = model.toLowerCase();
+        let providerName = null;
+        if (modelLower.startsWith('gpt-') || modelLower.startsWith('o3-') || modelLower.startsWith('o4-') || modelLower.startsWith('o1-')) {
+            providerName = 'openai';
+        }
+        else if (modelLower.startsWith('claude-')) {
+            providerName = 'anthropic';
+        }
+        else if (modelLower.startsWith('gemini-')) {
+            providerName = 'google';
+        }
+        else {
+            const definitions = ProvidersManager.getAllDefinitions();
+            for (const def of definitions) {
+                if (def.models.some(m => modelLower.includes(m.toLowerCase()))) {
+                    providerName = def.name;
+                    break;
+                }
+            }
+            if (!providerName) {
+                for (const def of definitions) {
+                    if (modelLower.startsWith(def.name + '/') || modelLower.startsWith(def.name + ':')) {
+                        providerName = def.name;
+                        break;
+                    }
+                }
+            }
+        }
+        if (providerName) {
+            const direct = ProvidersManager.getDirectConfig(providerName);
+            if (direct) {
+                const def = ProvidersManager.getDefinition(providerName);
+                return {
+                    baseUrl: direct.baseUrl,
+                    displayName: direct.displayName,
+                    providerName,
+                    openAICompat: def ? def.openAICompat : true,
+                };
+            }
+        }
+        return null;
+    }
+    /**
+     * Maps a model id to the provider that will actually serve the
+     * request — used as the key for `providerCooldown` tracking. The
+     * `freellmapi` sentinel covers the proxy path; everything else
+     * routes through a direct provider.
+     */
+    getProviderId(model) {
+        const direct = this.resolveDirectConfig(model);
+        if (direct)
+            return direct.providerName;
+        return 'freellmapi';
+    }
+    /* ─── Non-streaming chat ─── */
+    /**
+     * Sends one non-streaming chat request and returns a normalized result.
+     *
+     * Routing: when `resolveDirectConfig(model)` finds a direct provider the
+     * request goes to that provider (Anthropic via `/messages` with a
+     * translated body, everything else via `/chat/completions`), using a key
+     * obtained from the credential vault. Otherwise it goes to
+     * `${this.baseUrl}/chat/completions` with `this.apiKey` as Bearer token.
+     *
+     * Retries: the request is attempted up to MAX_RETRIES + 1 times. Statuses
+     * in RETRYABLE_STATUS_CODES and network/timeout errors are retried after
+     * BASE_DELAY_MS * 2^attempt milliseconds; each attempt has a 60 s timeout.
+     *
+     * @param messages Conversation messages; passed through
+     *                 `messagesForOpenAIWire` or `translateOpenAIToAnthropic`.
+     * @param model    Model id; also selects the route and the cooldown key.
+     * @param options  Extra request fields. On the OpenAI-compatible and proxy
+     *                 paths they are spread into the body after `model`,
+     *                 `messages` and `stream`, so they can override those
+     *                 keys. `tools`, `agent_task_type` and
+     *                 `required_capabilities` are additionally read on the
+     *                 proxy path.
+     * @returns `{ content, tool_calls, usage, model, finish_reason }`, where
+     *          `content` is a string or null.
+     * @throws Error for 413/404 responses, for any other non-OK response, for
+     *         non-network failures, and once retries are exhausted. Also
+     *         whatever `providerCooldown.assertAvailable` throws (presumably
+     *         when the provider is cooling down; verify in provider-cooldown).
+     */
+    async chat(messages, model, options = {}) {
+        const providerId = this.getProviderId(model);
+        providerCooldown.assertAvailable(providerId);
+        const direct = this.resolveDirectConfig(model);
+        const isAnthropicDirect = direct && direct.providerName === 'anthropic';
+        // Defaults describe the proxy route; the direct branch below replaces them.
+        let requestUrl = `${this.baseUrl}/chat/completions`;
+        let headers = {
+            'Content-Type': 'application/json',
+            'Authorization': `Bearer ${this.apiKey}`,
+        };
+        let body = '';
+        if (direct) {
+            // Pillar 4: source the API key from the credential vault so
+            // the raw value never lands in a return value, an error
+            // payload, or a log line. The key is reachable only inside
+            // the withApiKey callback.
+            const vault = getProviderKeyVault();
+            if (isAnthropicDirect) {
+                requestUrl = `${direct.baseUrl}/messages`;
+                headers = await vault.withApiKey(direct.providerName, (key) => ({
+                    'Content-Type': 'application/json',
+                    'x-api-key': key,
+                    'anthropic-version': '2023-06-01',
+                }));
+                body = JSON.stringify(translateOpenAIToAnthropic(messages, model, options));
+            }
+            else {
+                requestUrl = `${direct.baseUrl}/chat/completions`;
+                headers = await vault.withApiKey(direct.providerName, (key) => {
+                    const h = {
+                        'Content-Type': 'application/json',
+                        'Authorization': `Bearer ${key}`,
+                    };
+                    // Provider-specific attribution headers.
+                    if (direct.providerName === 'zen' || direct.providerName === 'openrouter') {
+                        h['HTTP-Referer'] = 'https://opencode.ai/';
+                        h['X-Title'] = 'opencode';
+                    }
+                    else if (direct.providerName === 'nvidia') {
+                        h['HTTP-Referer'] = 'https://opencode.ai/';
+                        h['X-Title'] = 'opencode';
+                        h['X-BILLING-INVOKE-ORIGIN'] = 'OpenCode';
+                    }
+                    else if (direct.providerName === 'cerebras') {
+                        h['X-Cerebras-3rd-Party-Integration'] = 'opencode';
+                    }
+                    return h;
+                });
+                // `options` is spread last, so it wins over the keys above.
+                const bodyObj = {
+                    model,
+                    messages: messagesForOpenAIWire(messages),
+                    stream: false,
+                    ...options,
+                };
+                body = JSON.stringify(bodyObj);
+            }
+        }
+        else {
+            // Proxy route: advertise tool use and the agent task type both in
+            // the body (x_* fields) and as request headers.
+            const hasTools = options.tools && Array.isArray(options.tools) && options.tools.length > 0;
+            const bodyObj = {
+                model,
+                messages: messagesForOpenAIWire(messages),
+                stream: false,
+                ...options,
+            };
+            if (hasTools) {
+                bodyObj.x_requires_tools = true;
+                headers['X-Requires-Tools'] = 'true';
+            }
+            if (options.agent_task_type) {
+                bodyObj.x_agent_task_type = options.agent_task_type;
+                bodyObj.x_required_capabilities = options.required_capabilities ?? [];
+                headers['X-Agent-Task-Type'] = options.agent_task_type;
+            }
+            body = JSON.stringify(bodyObj);
+        }
+        let lastError = null;
+        // `<=` is intentional: attempt 0 is the initial request, 1..MAX_RETRIES are retries.
+        for (let attempt = 0; attempt <= MAX_RETRIES; attempt++) {
+            try {
+                const response = await fetch(requestUrl, {
+                    method: 'POST',
+                    headers,
+                    body,
+                    signal: AbortSignal.timeout(60000), // 60s timeout
+                });
+                // Non-retryable errors
+                // (thrown here, then classified and rethrown by the catch below)
+                if (response.status === 413) {
+                    throw new Error(`Context too large (413). Reduce pinned files or use a model with a larger context window.`);
+                }
+                if (response.status === 404) {
+                    throw new Error(`Model not found (404). Try a different model with /model <name>.`);
+                }
+                // Retryable errors
+                if (RETRYABLE_STATUS_CODES.has(response.status)) {
+                    trackProviderError(providerId, response.status, `HTTP ${response.status}`);
+                    const delayMs = BASE_DELAY_MS * Math.pow(2, attempt);
+                    if (attempt < MAX_RETRIES) {
+                        console.log(`${colors.yellow}⚠  [API] Error ${response.status}. Retrying in ${(delayMs / 1000).toFixed(1)}s (${attempt + 1}/${MAX_RETRIES})${colors.reset}`);
+                        await sleep(delayMs);
+                        continue;
+                    }
+                    // On the last attempt, fall through to the generic
+                    // `!response.ok` error below.
+                }
+                if (!response.ok) {
+                    const errorText = await response.text().catch(() => 'Unknown error');
+                    throw new Error(`API error (${response.status}): ${errorText}`);
+                }
+                const rawData = await response.json();
+                // Anthropic responses are converted to the OpenAI shape so the
+                // code below handles a single format.
+                const data = isAnthropicDirect ? translateAnthropicToOpenAI(rawData) : rawData;
+                const choice = data.choices[0];
+                providerCooldown.recordSuccess(providerId);
+                // ChatResult.content is `string | null`. The widened
+                // ChatMessage.content union allows blocks on input, but
+                // every provider we ship returns text-only assistant
+                // messages, so we collapse to a string defensively.
+                const respContent = choice?.message?.content;
+                return {
+                    content: respContent == null
+                        ? null
+                        : typeof respContent === 'string'
+                            ? respContent
+                            : extractTextFromContent(respContent),
+                    tool_calls: choice?.message?.tool_calls ?? null,
+                    usage: data.usage ?? { prompt_tokens: 0, completion_tokens: 0, total_tokens: 0 },
+                    model: data.model,
+                    finish_reason: choice?.finish_reason ?? null,
+                };
+            }
+            catch (error) {
+                // Everything below classifies the failure by inspecting the
+                // error name and message text.
+                lastError = error instanceof Error ? error : new Error(String(error));
+                // Don't retry context too large errors
+                if (lastError.message.includes('413')) {
+                    throw lastError;
+                }
+                // 404 from the local FreeLLMAPI proxy = model not in catalog (user typo).
+                // This is a user error, not retryable.
+                if (lastError.message.includes('API error (404)')) {
+                    throw lastError;
+                }
+                // 502 from the local proxy = all configured providers exhausted/failed.
+                // Give actionable error instead of generic "retry".
+                // NOTE(review): the bare '502' substring also matches unrelated
+                // messages that merely contain those digits; confirm this is intended.
+                if (lastError.message.includes('API error (502)') || lastError.message.includes('502')) {
+                    const isAllExhausted = lastError.message.toLowerCase().includes('all models') ||
+                        lastError.message.toLowerCase().includes('provider error');
+                    if (isAllExhausted || attempt >= MAX_RETRIES - 1) {
+                        const helpMsg = lastError.message.toLowerCase().includes('provider error')
+                            ? `Provider error: all configured models failed or are rate-limited.\n  → Open http://localhost:5173 → API Keys → add more provider keys.\n  → Or wait a few minutes for rate limits to reset.`
+                            : lastError.message;
+                        throw new Error(helpMsg);
+                    }
+                }
+                // Retry network/timeout errors
+                const isNetworkError = lastError.name === 'TimeoutError' ||
+                    lastError.message.includes('Timeout') ||
+                    lastError.message.includes('ECONNREFUSED') ||
+                    lastError.message.includes('ECONNRESET') ||
+                    lastError.message.includes('fetch failed') ||
+                    lastError.message.includes('ETIMEDOUT');
+                // NOTE(review): this message names this.baseUrl and the local
+                // server even when requestUrl points at a direct provider;
+                // confirm whether the direct path should report its own URL.
+                if (lastError.message.includes('ECONNREFUSED') || lastError.message.includes('fetch failed')) {
+                    if (attempt >= MAX_RETRIES - 1) {
+                        throw new Error(`Cannot connect to FreeLLMAPI server at ${this.baseUrl}.\n` +
+                            `  → Make sure the server is running: npm run dev\n` +
+                            `  → Then restart the CLI: npm run cli`);
+                    }
+                }
+                if (isNetworkError && attempt < MAX_RETRIES) {
+                    // Network failures are recorded against the provider with status 0.
+                    trackProviderError(providerId, 0, lastError.message.slice(0, 200));
+                    const delayMs = BASE_DELAY_MS * Math.pow(2, attempt);
+                    console.log(`${colors.yellow}⚠  [Network] ${lastError.message.slice(0, 60)}. Retrying in ${(delayMs / 1000).toFixed(1)}s (${attempt + 1}/${MAX_RETRIES})${colors.reset}`);
+                    await sleep(delayMs);
+                    continue;
+                }
+                // Out of attempts: leave the loop and rethrow lastError below.
+                if (attempt >= MAX_RETRIES)
+                    break;
+                // Anything that is not a network error is surfaced immediately.
+                if (!isNetworkError)
+                    throw lastError;
+            }
+        }
+        throw lastError ?? new Error('All retry attempts exhausted.');
+    }
+    /* ─── Streaming chat (SSE) ─── */
+    async *executeSingleChatStreamAttempt(requestUrl, headers, body, model, isAnthropicDirect) {
+        const response = await fetch(requestUrl, {
+            method: 'POST',
+            headers,
+            body,
+            signal: AbortSignal.timeout(60000), // 60s timeout
+        });
+        if (response.status === 413) {
+            throw new Error(`Context too large (413). Reduce pinned files or use a model with a larger context window.`);
+        }
+        if (response.status === 404) {
+            throw new Error(`Model not found (404). Try a different model with /model <name>.`);
+        }
+        if (RETRYABLE_STATUS_CODES.has(response.status)) {
+            throw new HttpError(response.status, `API error ${response.status}`);
+        }
+        if (!response.ok) {
+            const errorText = await response.text().catch(() => 'Unknown error');
+            throw new Error(`API error (${response.status}): ${errorText}`);
+        }
+        if (!response.body) {
+            throw new Error('Response body is null — streaming not supported.');
+        }
+        // Parse SSE stream
+        const reader = response.body.getReader();
+        const decoder = new TextDecoder();
+        let buffer = '';
+        let accumulatedUsage = { prompt_tokens: 0, completion_tokens: 0, total_tokens: 0 };
+        let accumulatedModel = model;
+        const parser = new ThinkTagParser();
+        let currentToolCallIndex = 0;
+        while (true) {
+            const { done, value } = await reader.read();
+            if (done)
+                break;
+            buffer += decoder.decode(value, { stream: true });
+            const lines = buffer.split('\n');
+            buffer = lines.pop() ?? '';
+            for (const line of lines) {
+                const trimmed = line.trim();
+                if (!trimmed || trimmed === ':')
+                    continue; // Skip comments and empty lines
+                if (isAnthropicDirect) {
+                    if (trimmed.startsWith('event: ')) {
+                        continue;
+                    }
+                    if (!trimmed.startsWith('data: '))
+                        continue;
+                    const data = trimmed.slice(6);
+                    let chunk;
+                    try {
+                        chunk = JSON.parse(data);
+                    }
+                    catch {
+                        // skip malformed JSON chunks
+                        continue;
+                    }
+                    if (chunk && (chunk.type === 'error' || chunk.error)) {
+                        const errMsg = chunk.error && chunk.error.message
+                            ? chunk.error.message
+                            : (chunk.message || JSON.stringify(chunk));
+                        throw new Error(`Anthropic stream error: ${errMsg}`);
+                    }
+                    if (chunk.type === 'message_start') {
+                        if (chunk.message && chunk.message.model) {
+                            accumulatedModel = chunk.message.model;
+                        }
+                    }
+                    else if (chunk.type === 'content_block_start') {
+                        const block = chunk.content_block;
+                        currentToolCallIndex = chunk.index ?? 0;
+                        if (block && block.type === 'tool_use') {
+                            yield {
+                                type: 'tool_call_start',
+                                tool_call: {
+                                    index: currentToolCallIndex,
+                                    id: block.id,
+                                    function: {
+                                        name: block.name,
+                                        arguments: '',
+                                    }
+                                }
+                            };
+                        }
+                    }
+                    else if (chunk.type === 'content_block_delta') {
+                        const delta = chunk.delta;
+                        if (delta) {
+                            if (delta.type === 'text_delta' && delta.text) {
+                                for (const parsedChunk of parser.feed(delta.text)) {
+                                    if (parsedChunk.type === ContentType.THINKING) {
+                                        yield { type: 'thinking', thinking: parsedChunk.content };
+                                    }
+                                    else {
+                                        yield { type: 'content', content: parsedChunk.content };
+                                    }
+                                }
+                            }
+                            else if (delta.type === 'input_json_delta' && delta.partial_json) {
+                                yield {
+                                    type: 'tool_call_delta',
+                                    tool_call: {
+                                        index: currentToolCallIndex,
+                                        function: {
+                                            arguments: delta.partial_json,
+                                        }
+                                    }
+                                };
+                            }
+                        }
+                    }
+                    else if (chunk.type === 'message_delta') {
+                        if (chunk.usage) {
+                            accumulatedUsage = {
+                                prompt_tokens: chunk.usage.input_tokens || 0,
+                                completion_tokens: chunk.usage.output_tokens || 0,
+                                total_tokens: (chunk.usage.input_tokens || 0) + (chunk.usage.output_tokens || 0),
+                            };
+                        }
+                    }
+                    else if (chunk.type === 'message_stop') {
+                        const flushed = parser.flush();
+                        if (flushed) {
+                            if (flushed.type === ContentType.THINKING) {
+                                yield { type: 'thinking', thinking: flushed.content };
+                            }
+                            else {
+                                yield { type: 'content', content: flushed.content };
+                            }
+                        }
+                        yield {
+                            type: 'done',
+                            usage: accumulatedUsage,
+                            model: accumulatedModel,
+                        };
+                    }
+                }
+                else {
+                    if (!trimmed.startsWith('data: '))
+                        continue;
+                    const data = trimmed.slice(6);
+                    if (data === '[DONE]') {
+                        const flushed = parser.flush();
+                        if (flushed) {
+                            if (flushed.type === ContentType.THINKING) {
+                                yield { type: 'thinking', thinking: flushed.content };
+                            }
+                            else {
+                                yield { type: 'content', content: flushed.content };
+                            }
+                        }
+                        yield {
+                            type: 'done',
+                            usage: accumulatedUsage,
+                            model: accumulatedModel,
+                        };
+                        return;
+                    }
+                    let chunk;
+                    try {
+                        chunk = JSON.parse(data);
+                    }
+                    catch {
+                        // Skip malformed JSON chunks
+                        if (this.verbose) {
+                            console.log(`${colors.gray}[stream] Skipped malformed chunk: ${data.slice(0, 80)}${colors.reset}`);
+                        }
+                        continue;
+                    }
+                    if (chunk && chunk.error) {
+                        const errMsg = typeof chunk.error === 'object' && chunk.error.message
+                            ? chunk.error.message
+                            : JSON.stringify(chunk.error);
+                        throw new Error(`Stream error: ${errMsg}`);
+                    }
+                    if (chunk.model)
+                        accumulatedModel = chunk.model;
+                    if (chunk.usage) {
+                        accumulatedUsage = chunk.usage;
+                    }
+                    const choice = chunk.choices?.[0];
+                    if (!choice)
+                        continue;
+                    // reasoning_content delta
+                    if (choice.delta.reasoning_content) {
+                        yield {
+                            type: 'thinking',
+                            thinking: choice.delta.reasoning_content,
+                        };
+                    }
+                    // Content delta
+                    if (choice.delta?.content) {
+                        for (const parsedChunk of parser.feed(choice.delta.content)) {
+                            if (parsedChunk.type === ContentType.THINKING) {
+                                yield {
+                                    type: 'thinking',
+                                    thinking: parsedChunk.content,
+                                };
+                            }
+                            else {
+                                yield {
+                                    type: 'content',
+                                    content: parsedChunk.content,
+                                };
+                            }
+                        }
+                    }
+                    // Tool call deltas
+                    if (choice.delta?.tool_calls) {
+                        for (const tc of choice.delta.tool_calls) {
+                            const idx = tc.index ?? 0;
+                            if (tc.id) {
+                                yield {
+                                    type: 'tool_call_start',
+                                    tool_call: {
+                                        index: idx,
+                                        id: tc.id,
+                                        function: {
+                                            name: tc.function?.name ?? '',
+                                            arguments: tc.function?.arguments ?? '',
+                                        },
+                                    },
+                                };
+                            }
+                            else {
+                                yield {
+                                    type: 'tool_call_delta',
+                                    tool_call: {
+                                        index: idx,
+                                        function: {
+                                            arguments: tc.function?.arguments ?? '',
+                                        },
+                                    },
+                                };
+                            }
+                        }
+                    }
+                    // Finish reason
+                    if (choice.finish_reason) {
+                        const flushed = parser.flush();
+                        if (flushed) {
+                            if (flushed.type === ContentType.THINKING) {
+                                yield { type: 'thinking', thinking: flushed.content };
+                            }
+                            else {
+                                yield { type: 'content', content: flushed.content };
+                            }
+                        }
+                        yield {
+                            type: 'done',
+                            finish_reason: choice.finish_reason,
+                            usage: accumulatedUsage,
+                            model: accumulatedModel,
+                        };
+                    }
+                }
+            }
+        }
+        // Stream ended without [DONE]
+        const flushed = parser.flush();
+        if (flushed) {
+            if (flushed.type === ContentType.THINKING) {
+                yield { type: 'thinking', thinking: flushed.content };
+            }
+            else {
+                yield { type: 'content', content: flushed.content };
+            }
+        }
+        yield {
+            type: 'done',
+            usage: accumulatedUsage,
+            model: accumulatedModel,
+        };
+    }
+    /**
+     * Stream a chat completion, retrying failed attempts that have not yet
+     * produced any output.
+     *
+     * The request is built for one of three targets: a direct Anthropic
+     * endpoint (`/messages`), a direct OpenAI-compatible provider
+     * (`/chat/completions` on the provider's base URL), or the proxy at
+     * `this.baseUrl`. Each attempt is delegated to
+     * `executeSingleChatStreamAttempt` and its chunks are re-yielded as-is.
+     *
+     * @param messages Conversation to send.
+     * @param model Model identifier; also used to resolve the provider.
+     * @param options Extra request fields. They are spread into the
+     *   OpenAI-shaped bodies AFTER `model`, `messages` and `stream`, so a key
+     *   of the same name in `options` overrides those.
+     * @throws The last error once retries are exhausted, immediately for
+     *   non-retryable errors, and immediately for any error raised after the
+     *   first chunk was yielded.
+     */
+    async *chatStream(messages, model, options = {}) {
+        const providerId = this.getProviderId(model);
+        // NOTE(review): presumably throws while the provider is cooling down — confirm in providerCooldown.
+        providerCooldown.assertAvailable(providerId);
+        const direct = this.resolveDirectConfig(model);
+        const isAnthropicDirect = !!(direct && direct.providerName === 'anthropic');
+        // Defaults target the proxy; the direct branches below replace URL and headers.
+        let requestUrl = `${this.baseUrl}/chat/completions`;
+        let headers = {
+            'Content-Type': 'application/json',
+            'Authorization': `Bearer ${this.apiKey}`,
+        };
+        let body = '';
+        if (direct) {
+            // Pillar 4: source the API key from the credential vault.
+            const vault = getProviderKeyVault();
+            if (isAnthropicDirect) {
+                requestUrl = `${direct.baseUrl}/messages`;
+                headers = await vault.withApiKey(direct.providerName, (key) => ({
+                    'Content-Type': 'application/json',
+                    'x-api-key': key,
+                    'anthropic-version': '2023-06-01',
+                }));
+                const payload = translateOpenAIToAnthropic(messages, model, options);
+                payload.stream = true;
+                body = JSON.stringify(payload);
+            }
+            else {
+                requestUrl = `${direct.baseUrl}/chat/completions`;
+                headers = await vault.withApiKey(direct.providerName, (key) => {
+                    const h = {
+                        'Content-Type': 'application/json',
+                        'Authorization': `Bearer ${key}`,
+                    };
+                    // Provider-specific attribution headers.
+                    if (direct.providerName === 'zen' || direct.providerName === 'openrouter') {
+                        h['HTTP-Referer'] = 'https://opencode.ai/';
+                        h['X-Title'] = 'opencode';
+                    }
+                    else if (direct.providerName === 'nvidia') {
+                        h['HTTP-Referer'] = 'https://opencode.ai/';
+                        h['X-Title'] = 'opencode';
+                        h['X-BILLING-INVOKE-ORIGIN'] = 'OpenCode';
+                    }
+                    else if (direct.providerName === 'cerebras') {
+                        h['X-Cerebras-3rd-Party-Integration'] = 'opencode';
+                    }
+                    return h;
+                });
+                const bodyObj = {
+                    model,
+                    messages: messagesForOpenAIWire(messages),
+                    stream: true,
+                    ...options,
+                };
+                body = JSON.stringify(bodyObj);
+            }
+        }
+        else {
+            // Proxy path: routing hints are sent both as body fields and as headers.
+            const hasTools = options.tools && Array.isArray(options.tools) && options.tools.length > 0;
+            const bodyObj = {
+                model,
+                messages: messagesForOpenAIWire(messages),
+                stream: true,
+                ...options,
+            };
+            if (hasTools) {
+                bodyObj.x_requires_tools = true;
+                headers['X-Requires-Tools'] = 'true';
+            }
+            if (options.agent_task_type) {
+                bodyObj.x_agent_task_type = options.agent_task_type;
+                bodyObj.x_required_capabilities = options.required_capabilities ?? [];
+                headers['X-Agent-Task-Type'] = options.agent_task_type;
+            }
+            body = JSON.stringify(bodyObj);
+        }
+        let lastError = null;
+        // Sticky across attempts: once any chunk reached the consumer, no retry is allowed.
+        let hasYielded = false;
+        // Attempts run from 0 through MAX_RETRIES inclusive.
+        for (let attempt = 0; attempt <= MAX_RETRIES; attempt++) {
+            try {
+                const stream = this.executeSingleChatStreamAttempt(requestUrl, headers, body, model, isAnthropicDirect);
+                for await (const chunk of stream) {
+                    hasYielded = true;
+                    yield chunk;
+                }
+                providerCooldown.recordSuccess(providerId);
+                return; // Success — don't retry
+            }
+            catch (error) {
+                // Normalize non-Error throwables so `.message` / `.name` are always readable below.
+                lastError = error instanceof Error ? error : new Error(String(error));
+                if (hasYielded) {
+                    // If we have already yielded some chunks, do not retry because we cannot
+                    // rewind/resume the stream. Retrying would yield duplicate tokens on stdout.
+                    throw lastError;
+                }
+                // Don't retry context too large
+                // (substring match: any message containing "413" takes this path)
+                if (lastError.message.includes('413')) {
+                    throw lastError;
+                }
+                // 404 from proxy = model not in catalog (user typo), not retryable
+                if (lastError.message.includes('API error (404)')) {
+                    throw lastError;
+                }
+                // 502 from proxy = all providers exhausted
+                // NOTE(review): the second test subsumes the first — any message containing "502" matches.
+                if (lastError.message.includes('API error (502)') || lastError.message.includes('502')) {
+                    const isAllExhausted = lastError.message.toLowerCase().includes('all models') ||
+                        lastError.message.toLowerCase().includes('provider error');
+                    // Gives up at attempt MAX_RETRIES - 1, i.e. before the loop's own bound is reached.
+                    if (isAllExhausted || attempt >= MAX_RETRIES - 1) {
+                        const helpMsg = lastError.message.toLowerCase().includes('provider error')
+                            ? `Provider error: all configured models failed or are rate-limited.\n  → Open http://localhost:5173 → API Keys → add more provider keys.\n  → Or wait a few minutes for rate limits to reset.`
+                            : lastError.message;
+                        // The rethrown value is a plain Error, so an HttpError's type/status is not preserved here.
+                        throw new Error(helpMsg);
+                    }
+                }
+                // Network-level failures are recognized by error name or message substring.
+                const isNetworkError = lastError.name === 'TimeoutError' ||
+                    lastError.message.includes('Timeout') ||
+                    lastError.message.includes('ECONNREFUSED') ||
+                    lastError.message.includes('ECONNRESET') ||
+                    lastError.message.includes('fetch failed') ||
+                    lastError.message.includes('ETIMEDOUT');
+                // Connection failures get a friendlier message, again from attempt MAX_RETRIES - 1 onward.
+                if (lastError.message.includes('ECONNREFUSED') || lastError.message.includes('fetch failed')) {
+                    if (attempt >= MAX_RETRIES - 1) {
+                        throw new Error(`Cannot connect to FreeLLMAPI server at ${this.baseUrl}.\n` +
+                            `  → Make sure the server is running: npm run dev\n` +
+                            `  → Then restart the CLI: npm run cli`);
+                    }
+                }
+                // Retryable HTTP status: record it, then back off exponentially (BASE_DELAY_MS * 2^attempt).
+                if (lastError instanceof HttpError && RETRYABLE_STATUS_CODES.has(lastError.status)) {
+                    trackProviderError(providerId, lastError.status, `HTTP ${lastError.status}`);
+                    const delayMs = BASE_DELAY_MS * Math.pow(2, attempt);
+                    if (attempt < MAX_RETRIES) {
+                        console.log(`${colors.yellow}⚠  [API] Error ${lastError.status}. Retrying in ${(delayMs / 1000).toFixed(1)}s (${attempt + 1}/${MAX_RETRIES})${colors.reset}`);
+                        await sleep(delayMs);
+                        continue;
+                    }
+                }
+                // Network failure: recorded with status 0 and a truncated message, same backoff schedule.
+                if (isNetworkError && attempt < MAX_RETRIES) {
+                    trackProviderError(providerId, 0, lastError.message.slice(0, 200));
+                    const delayMs = BASE_DELAY_MS * Math.pow(2, attempt);
+                    console.log(`${colors.yellow}⚠  [Network] ${lastError.message.slice(0, 60)}. Retrying in ${(delayMs / 1000).toFixed(1)}s (${attempt + 1}/${MAX_RETRIES})${colors.reset}`);
+                    await sleep(delayMs);
+                    continue;
+                }
+                // Out of attempts: leave the loop so the final throw reports lastError.
+                if (attempt >= MAX_RETRIES)
+                    break;
+                // Anything that is not a network failure is rethrown without retrying.
+                if (!isNetworkError)
+                    throw lastError;
+            }
+        }
+        throw lastError ?? new Error('All streaming retry attempts exhausted.');
+    }
+    /**
+     * Streaming chat with autonomous mid-stream resume.
+     *
+     * If the underlying `chatStream` throws *after* at least one chunk
+     * has been yielded, the resume engine inspects the partial response,
+     * appends a "continue from here" payload to the working message list,
+     * and starts a fresh streaming attempt. The consumer sees a single
+     * continuous `AsyncGenerator<StreamChunk>` — the resume is invisible.
+     *
+     * The engine respects:
+     *   - `maxResumeAttempts` (default 3) — additional attempts beyond
+     *     this throw `StreamResumeExhaustedError`.
+     *   - `isMidStreamResumable` — user aborts and 4xx are never resumed.
+     *   - Cuts inside a tool call — the partial text up to the tool call
+     *     boundary is preserved, but the call itself cannot be resumed.
+     *
+     * The method is *additive* and does not change the existing
+     * `chatStream` contract. Callers opt in by switching to this entry
+     * point (see `SingleAgent.streamResponse`).
+     */
+    async *chatStreamWithResume(messages, model, options = {}, maxResumeAttempts = 3) {
+        const workingMessages = messages.map((m) => ({ ...m }));
+        let resumeAttempt = 0;
+        // Per-attempt state. Reset at the top of every loop iteration.
+        let attemptChunks = [];
+        let attemptYielded = false;
+        while (true) {
+            attemptChunks = [];
+            attemptYielded = false;
+            try {
+                for await (const chunk of this.chatStream(workingMessages, model, options)) {
+                    attemptChunks.push(chunk);
+                    attemptYielded = true;
+                    yield chunk;
+                }
+                return; // Natural completion.
+            }
+            catch (err) {
+                // Pre-stream error — the inner chatStream never even started
+                // (413, 404, 502 all-models-exhausted, etc.). Do not attempt a
+                // resume; bubble up unchanged so the agent loop can react.
+                if (!attemptYielded) {
+                    throw err;
+                }
+                // If the inner stream was already yielding a tool call, the
+                // tool call is atomic and cannot be resumed.
+                const last = attemptChunks[attemptChunks.length - 1];
+                const cutDuringToolCall = !!last && (last.type === 'tool_call_start' || last.type === 'tool_call_delta');
+                // Errors that are explicitly not candidates for a resume.
+                if (!isMidStreamResumable(err) || cutDuringToolCall) {
+                    recordTelemetry(telemetry.streamResume({
+                        resumeAttempt,
+                        partialTokens: Math.ceil(reconstructPartialResponse(attemptChunks).length / 4),
+                        ok: false,
+                        reason: cutDuringToolCall ? 'tool-call-cut' : 'non-resumable',
+                    }));
+                    throw new StreamResumeExhaustedError(cutDuringToolCall
+                        ? `Stream cut during a tool call after ${attemptChunks.length} chunks; cannot resume.`
+                        : err instanceof Error
+                            ? `Stream cut and error is non-resumable: ${err.message}`
+                            : 'Stream cut and error is non-resumable.', {
+                        resumeAttempt,
+                        chunks: attemptChunks,
+                        partial: reconstructPartialResponse(attemptChunks),
+                        cutDuringToolCall,
+                    });
+                }
+                if (resumeAttempt >= maxResumeAttempts) {
+                    recordTelemetry(telemetry.streamResume({
+                        resumeAttempt,
+                        partialTokens: Math.ceil(reconstructPartialResponse(attemptChunks).length / 4),
+                        ok: false,
+                        reason: 'exhausted',
+                    }));
+                    throw new StreamResumeExhaustedError(`Stream resume attempts exhausted (${resumeAttempt}/${maxResumeAttempts}).`, {
+                        resumeAttempt,
+                        chunks: attemptChunks,
+                        partial: reconstructPartialResponse(attemptChunks),
+                    });
+                }
+                const partial = reconstructPartialResponse(attemptChunks);
+                if (partial === '') {
+                    recordTelemetry(telemetry.streamResume({ resumeAttempt, partialTokens: 0, ok: false, reason: 'empty-partial' }));
+                    throw new StreamResumeExhaustedError('No partial content available to resume from.', { resumeAttempt, chunks: attemptChunks, partial: '' });
+                }
+                // Build the resume payload: assistant partial + user "continue".
+                workingMessages.push({ role: 'assistant', content: partial });
+                workingMessages.push({
+                    role: 'user',
+                    content: `[STREAM RESUMED] Your previous response was interrupted at ` +
+                        `${attemptChunks.length} chunks. Continue exactly from where you left off. ` +
+                        'Do NOT repeat the partial content. Do NOT add preamble. ' +
+                        'Begin mid-sentence if needed.',
+                });
+                resumeAttempt += 1;
+                // Telemetry: this attempt succeeded; the next one is in flight.
+                recordTelemetry(telemetry.streamResume({
+                    resumeAttempt,
+                    partialTokens: Math.ceil(partial.length / 4),
+                    ok: true,
+                }));
+                // Loop continues with the augmented message list.
+            }
+        }
+    }
+    async getEmbedding(text, model = 'text-embedding-3-small') {
+        const providerId = this.getProviderId(model);
+        providerCooldown.assertAvailable(providerId);
+        const direct = this.resolveDirectConfig(model);
+        let requestUrl = `${this.baseUrl}/embeddings`;
+        let headers = {
+            'Content-Type': 'application/json',
+            'Authorization': `Bearer ${this.apiKey}`,
+        };
+        if (direct) {
+            // Pillar 4: source the API key from the credential vault.
+            const vault = getProviderKeyVault();
+            requestUrl = `${direct.baseUrl}/embeddings`;
+            headers = await vault.withApiKey(direct.providerName, (key) => ({
+                'Content-Type': 'application/json',
+                'Authorization': `Bearer ${key}`,
+            }));
+        }
+        const body = JSON.stringify({
+            model,
+            input: text,
+        });
+        for (let attempt = 0; attempt <= MAX_RETRIES; attempt++) {
+            try {
+                const response = await fetch(requestUrl, {
+                    method: 'POST',
+                    headers,
+                    body,
+                });
+                if (RETRYABLE_STATUS_CODES.has(response.status)) {
+                    trackProviderError(providerId, response.status, `HTTP ${response.status}`);
+                    const delayMs = BASE_DELAY_MS * Math.pow(2, attempt);
+                    if (attempt < MAX_RETRIES) {
+                        if (this.verbose) {
+                            console.log(`${colors.yellow}⚠  [API] Embedding error ${response.status}. Retrying in ${(delayMs / 1000).toFixed(1)}s (${attempt + 1}/${MAX_RETRIES})${colors.reset}`);
+                        }
+                        await sleep(delayMs);
+                        continue;
+                    }
+                }
+                if (!response.ok) {
+                    const errorText = await response.text().catch(() => 'Unknown error');
+                    throw new Error(`API error (${response.status}): ${errorText}`);
+                }
+                const data = await response.json();
+                if (data.data && data.data[0] && data.data[0].embedding) {
+                    providerCooldown.recordSuccess(providerId);
+                    return data.data[0].embedding;
+                }
+                throw new Error('Malformed embedding response structure');
+            }
+            catch (error) {
+                if (attempt >= MAX_RETRIES)
+                    throw error;
+                const isNetworkError = error instanceof Error && (error.name === 'TimeoutError' ||
+                    error.message.includes('ECONNREFUSED') ||
+                    error.message.includes('fetch failed') ||
+                    error.message.includes('ETIMEDOUT'));
+                if (isNetworkError) {
+                    trackProviderError(providerId, 0, error.message.slice(0, 200));
+                }
+                const delayMs = BASE_DELAY_MS * Math.pow(2, attempt);
+                await sleep(delayMs);
+            }
+        }
+        throw new Error('All embedding retry attempts exhausted.');
+    }
+    /* ─── Health probe ─── */
+    async ping() {
+        try {
+            const response = await fetch(`${this.baseUrl}/models`, {
+                headers: {
+                    'Authorization': `Bearer ${this.apiKey}`,
+                },
+                signal: AbortSignal.timeout(4000),
+            });
+            return response.ok;
+        }
+        catch {
+            return false;
+        }
+    }
+}
+/* ──────────────────────── Helpers ──────────────────────── */
+function sleep(ms) {
+    return new Promise(resolve => setTimeout(resolve, ms));
+}
+/* ──────────────────────── Translation Helpers ──────────────────────── */
+/**
+ * Translate a `ChatMessage.content` value to the Anthropic `user`
+ * content shape. Plain strings stay verbatim; block arrays are
+ * mapped 1:1 with image blocks rewritten to Anthropic's `source`
+ * sub-object.
+ */
+function toAnthropicUserContent(content) {
+    if (content == null)
+        return '';
+    if (typeof content === 'string')
+        return content;
+    return content.map((block) => {
+        if (block.type === 'text')
+            return { type: 'text', text: block.text };
+        // image
+        if (block.source.kind === 'base64') {
+            return {
+                type: 'image',
+                source: {
+                    type: 'base64',
+                    media_type: block.source.mediaType,
+                    data: block.source.data,
+                },
+            };
+        }
+        // url — Anthropic supports url-shaped image sources as of 2024-06.
+        return {
+            type: 'image',
+            source: { type: 'url', url: block.source.url },
+        };
+    });
+}
+/**
+ * Translate a `ChatMessage.content` value to the OpenAI chat
+ * completions `user` content shape (string OR a block array with
+ * `image_url` blocks, per the OpenAI vision spec).
+ */
+function toOpenAIUserContent(content) {
+    if (content == null)
+        return '';
+    if (typeof content === 'string')
+        return content;
+    return content.map((block) => {
+        if (block.type === 'text')
+            return { type: 'text', text: block.text };
+        if (block.source.kind === 'base64') {
+            const dataUrl = `data:${block.source.mediaType};base64,${block.source.data}`;
+            return { type: 'image_url', image_url: { url: dataUrl } };
+        }
+        return { type: 'image_url', image_url: { url: block.source.url } };
+    });
+}
+/**
+ * Produce the message list to send to an OpenAI-compatible
+ * endpoint.
+ *
+ * When no message carries array (block) content, the input array
+ * itself is returned. Otherwise a new array is built: `user`
+ * messages get their content converted by `toOpenAIUserContent`,
+ * any other message with block content is collapsed to text via
+ * `extractTextFromContent`, and the remaining messages are reused
+ * as-is. Converted messages are shallow copies, so neither the
+ * input array nor its message objects are mutated.
+ */
+function messagesForOpenAIWire(messages) {
+    const hasBlockContent = messages.some((entry) => Array.isArray(entry.content));
+    if (!hasBlockContent) {
+        return messages;
+    }
+    return messages.map((entry) => {
+        const { role, content } = entry;
+        if (role === 'user') {
+            return { ...entry, content: toOpenAIUserContent(content) };
+        }
+        // Assistant / system / tool messages never carry images on
+        // the wire, so block content is reduced to its text.
+        return Array.isArray(content)
+            ? { ...entry, content: extractTextFromContent(content) }
+            : entry;
+    });
+}
+/**
+ * Build an Anthropic Messages API request body from an OpenAI-style
+ * chat request.
+ *
+ * Role handling:
+ *  - `system`: flattened to text; multiple system messages are
+ *    joined with a newline into `body.system`.
+ *  - `user`: content is converted by `toAnthropicUserContent`.
+ *  - `assistant`: plain text, or a block array (optional text block
+ *    followed by one `tool_use` block per entry) when `tool_calls`
+ *    is non-empty.
+ *  - `tool`: emitted as a `user` message holding one `tool_result`
+ *    block keyed by `tool_call_id`.
+ *  Messages with any other role are skipped.
+ *
+ * @param {Array<object>} messages OpenAI-style chat messages.
+ * @param {string} model Model identifier copied to `body.model`.
+ * @param {object} [options] Optional `max_tokens` (defaults to 4096),
+ *   `temperature`, `tools` and `tool_choice`.
+ * @returns {object} Body with `model`, `messages`, `max_tokens` and,
+ *   when applicable, `system`, `temperature`, `tools`, `tool_choice`.
+ */
+function translateOpenAIToAnthropic(messages, model, options = {}) {
+    let system = '';
+    const anthropicMessages = [];
+    for (const msg of messages) {
+        if (msg.role === 'system') {
+            // System messages must be plain text, so any block
+            // content is flattened before it is appended.
+            const sysText = extractTextFromContent(msg.content);
+            system = system ? `${system}\n${sysText}` : sysText;
+        }
+        else if (msg.role === 'user') {
+            anthropicMessages.push({
+                role: 'user',
+                content: toAnthropicUserContent(msg.content),
+            });
+        }
+        else if (msg.role === 'assistant') {
+            const assistantText = extractTextFromContent(msg.content);
+            if (msg.tool_calls && msg.tool_calls.length > 0) {
+                const contentBlocks = [];
+                if (assistantText.length > 0) {
+                    contentBlocks.push({ type: 'text', text: assistantText });
+                }
+                for (const tc of msg.tool_calls) {
+                    let inputObj;
+                    try {
+                        inputObj = JSON.parse(tc.function.arguments);
+                    }
+                    catch {
+                        // Unparseable arguments are preserved verbatim.
+                        inputObj = { raw: tc.function.arguments };
+                    }
+                    // `tool_use.input` must be a JSON object; valid JSON
+                    // that is not an object (null, number, string, array)
+                    // is wrapped the same way as unparseable text.
+                    if (inputObj === null || typeof inputObj !== 'object' || Array.isArray(inputObj)) {
+                        inputObj = { raw: tc.function.arguments };
+                    }
+                    contentBlocks.push({
+                        type: 'tool_use',
+                        id: tc.id,
+                        name: tc.function.name,
+                        input: inputObj,
+                    });
+                }
+                anthropicMessages.push({
+                    role: 'assistant',
+                    content: contentBlocks,
+                });
+            }
+            else {
+                anthropicMessages.push({
+                    role: 'assistant',
+                    content: assistantText,
+                });
+            }
+        }
+        else if (msg.role === 'tool') {
+            anthropicMessages.push({
+                role: 'user',
+                content: [
+                    {
+                        type: 'tool_result',
+                        tool_use_id: msg.tool_call_id,
+                        content: extractTextFromContent(msg.content),
+                    },
+                ],
+            });
+        }
+    }
+    const body = {
+        model,
+        messages: anthropicMessages,
+        max_tokens: options.max_tokens ?? 4096,
+    };
+    if (system) {
+        body.system = system;
+    }
+    if (options.temperature !== undefined) {
+        body.temperature = options.temperature;
+    }
+    if (options.tools && options.tools.length > 0) {
+        body.tools = options.tools.map((tool) => ({
+            name: tool.function.name,
+            description: tool.function.description,
+            input_schema: tool.function.parameters,
+        }));
+        // `tool_choice` is only forwarded together with tools.
+        const choice = options.tool_choice;
+        if (choice) {
+            if (choice === 'auto' || choice === 'none') {
+                body.tool_choice = { type: choice };
+            }
+            else if (choice === 'required') {
+                // OpenAI "required" (must call some tool) is "any" on Anthropic.
+                body.tool_choice = { type: 'any' };
+            }
+            else if (typeof choice === 'object' && choice.function) {
+                // Forcing one named tool uses type "tool"; "any" takes no name.
+                body.tool_choice = {
+                    type: 'tool',
+                    name: choice.function.name,
+                };
+            }
+        }
+    }
+    return body;
+}
+/**
+ * Reshape an Anthropic Messages API response into an OpenAI
+ * `chat.completion` object with a single choice.
+ *
+ * Text blocks are concatenated into the assistant message content
+ * (`null` when the result is empty), `tool_use` blocks become
+ * `tool_calls` with JSON-stringified arguments, `stop_reason` is
+ * mapped to an OpenAI `finish_reason` (falling back to `'stop'`),
+ * and token usage is renamed and summed. A non-array `content` is
+ * treated as having no blocks.
+ */
+function translateAnthropicToOpenAI(anthropicRes) {
+    const STOP_REASON_TO_FINISH_REASON = {
+        end_turn: 'stop',
+        max_tokens: 'length',
+        tool_use: 'tool_calls',
+        stop_sequence: 'stop',
+    };
+    const blocks = Array.isArray(anthropicRes.content) ? anthropicRes.content : [];
+    let combinedText = '';
+    const calls = [];
+    for (const part of blocks) {
+        switch (part.type) {
+            case 'text':
+                combinedText += part.text;
+                break;
+            case 'tool_use':
+                calls.push({
+                    id: part.id,
+                    type: 'function',
+                    function: {
+                        name: part.name,
+                        arguments: JSON.stringify(part.input),
+                    },
+                });
+                break;
+            default:
+                // Other block types are ignored.
+                break;
+        }
+    }
+    const message = {
+        role: 'assistant',
+        content: combinedText || null,
+    };
+    // `tool_calls` is only present when at least one tool was used.
+    if (calls.length > 0) {
+        message.tool_calls = calls;
+    }
+    let usage = { prompt_tokens: 0, completion_tokens: 0, total_tokens: 0 };
+    if (anthropicRes.usage) {
+        const promptTokens = anthropicRes.usage.input_tokens || 0;
+        const completionTokens = anthropicRes.usage.output_tokens || 0;
+        usage = {
+            prompt_tokens: promptTokens,
+            completion_tokens: completionTokens,
+            total_tokens: promptTokens + completionTokens,
+        };
+    }
+    return {
+        id: anthropicRes.id || `anthropic-${Date.now()}`,
+        object: 'chat.completion',
+        created: Math.floor(Date.now() / 1000),
+        model: anthropicRes.model || '',
+        choices: [
+            {
+                index: 0,
+                message,
+                finish_reason: STOP_REASON_TO_FINISH_REASON[anthropicRes.stop_reason] || 'stop',
+            },
+        ],
+        usage,
+    };
+}
+//# sourceMappingURL=agent-client.js.map