npm - @juspay/neurolink - Versions diffs - 9.40.0 → 9.42.0 - Mend

@juspay/neurolink 9.40.0 → 9.42.0

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.

Files changed (224) hide show

package/CHANGELOG.md +12 -0
package/README.md +7 -1
package/dist/auth/anthropicOAuth.d.ts +18 -3
package/dist/auth/anthropicOAuth.js +137 -4
package/dist/auth/providers/firebase.js +5 -1
package/dist/auth/providers/jwt.js +5 -1
package/dist/auth/providers/workos.js +5 -1
package/dist/auth/sessionManager.d.ts +1 -1
package/dist/auth/sessionManager.js +58 -27
package/dist/browser/neurolink.min.js +471 -445
package/dist/cli/commands/mcp.js +3 -0
package/dist/cli/commands/proxy.d.ts +2 -1
package/dist/cli/commands/proxy.js +279 -16
package/dist/cli/commands/task.d.ts +56 -0
package/dist/cli/commands/task.js +838 -0
package/dist/cli/factories/commandFactory.d.ts +2 -0
package/dist/cli/factories/commandFactory.js +38 -0
package/dist/cli/parser.js +8 -4
package/dist/client/aiSdkAdapter.js +3 -0
package/dist/client/streamingClient.js +30 -10
package/dist/core/modules/GenerationHandler.js +3 -2
package/dist/core/redisConversationMemoryManager.js +7 -3
package/dist/evaluation/BatchEvaluator.js +4 -1
package/dist/evaluation/hooks/observabilityHooks.js +5 -3
package/dist/evaluation/pipeline/evaluationPipeline.d.ts +3 -2
package/dist/evaluation/pipeline/evaluationPipeline.js +20 -8
package/dist/evaluation/pipeline/strategies/batchStrategy.js +6 -3
package/dist/evaluation/pipeline/strategies/samplingStrategy.js +18 -10
package/dist/lib/auth/anthropicOAuth.d.ts +18 -3
package/dist/lib/auth/anthropicOAuth.js +137 -4
package/dist/lib/auth/providers/firebase.js +5 -1
package/dist/lib/auth/providers/jwt.js +5 -1
package/dist/lib/auth/providers/workos.js +5 -1
package/dist/lib/auth/sessionManager.d.ts +1 -1
package/dist/lib/auth/sessionManager.js +58 -27
package/dist/lib/client/aiSdkAdapter.js +3 -0
package/dist/lib/client/streamingClient.js +30 -10
package/dist/lib/core/modules/GenerationHandler.js +3 -2
package/dist/lib/core/redisConversationMemoryManager.js +7 -3
package/dist/lib/evaluation/BatchEvaluator.js +4 -1
package/dist/lib/evaluation/hooks/observabilityHooks.js +5 -3
package/dist/lib/evaluation/pipeline/evaluationPipeline.d.ts +3 -2
package/dist/lib/evaluation/pipeline/evaluationPipeline.js +20 -8
package/dist/lib/evaluation/pipeline/strategies/batchStrategy.js +6 -3
package/dist/lib/evaluation/pipeline/strategies/samplingStrategy.js +18 -10
package/dist/lib/neurolink.d.ts +18 -1
package/dist/lib/neurolink.js +367 -484
package/dist/lib/observability/otelBridge.d.ts +2 -2
package/dist/lib/observability/otelBridge.js +12 -3
package/dist/lib/providers/amazonBedrock.js +2 -4
package/dist/lib/providers/anthropic.d.ts +9 -5
package/dist/lib/providers/anthropic.js +19 -14
package/dist/lib/providers/anthropicBaseProvider.d.ts +3 -3
package/dist/lib/providers/anthropicBaseProvider.js +5 -4
package/dist/lib/providers/azureOpenai.d.ts +1 -1
package/dist/lib/providers/azureOpenai.js +5 -4
package/dist/lib/providers/googleAiStudio.js +30 -1
package/dist/lib/providers/googleVertex.js +28 -6
package/dist/lib/providers/huggingFace.d.ts +3 -3
package/dist/lib/providers/huggingFace.js +6 -8
package/dist/lib/providers/litellm.js +41 -29
package/dist/lib/providers/mistral.js +2 -1
package/dist/lib/providers/ollama.js +80 -23
package/dist/lib/providers/openAI.js +3 -2
package/dist/lib/providers/openRouter.js +2 -1
package/dist/lib/providers/openaiCompatible.d.ts +4 -4
package/dist/lib/providers/openaiCompatible.js +4 -4
package/dist/lib/proxy/claudeFormat.d.ts +3 -2
package/dist/lib/proxy/claudeFormat.js +25 -20
package/dist/lib/proxy/cloaking/plugins/sessionIdentity.d.ts +2 -6
package/dist/lib/proxy/cloaking/plugins/sessionIdentity.js +9 -33
package/dist/lib/proxy/modelRouter.js +3 -0
package/dist/lib/proxy/oauthFetch.d.ts +1 -1
package/dist/lib/proxy/oauthFetch.js +65 -72
package/dist/lib/proxy/proxyConfig.js +44 -24
package/dist/lib/proxy/proxyEnv.d.ts +19 -0
package/dist/lib/proxy/proxyEnv.js +73 -0
package/dist/lib/proxy/proxyFetch.js +50 -4
package/dist/lib/proxy/proxyTracer.d.ts +133 -0
package/dist/lib/proxy/proxyTracer.js +645 -0
package/dist/lib/proxy/rawStreamCapture.d.ts +10 -0
package/dist/lib/proxy/rawStreamCapture.js +83 -0
package/dist/lib/proxy/requestLogger.d.ts +32 -5
package/dist/lib/proxy/requestLogger.js +406 -37
package/dist/lib/proxy/sseInterceptor.d.ts +97 -0
package/dist/lib/proxy/sseInterceptor.js +402 -0
package/dist/lib/proxy/usageStats.d.ts +4 -3
package/dist/lib/proxy/usageStats.js +25 -12
package/dist/lib/rag/chunkers/MarkdownChunker.js +13 -5
package/dist/lib/rag/chunking/markdownChunker.js +15 -6
package/dist/lib/server/routes/claudeProxyRoutes.d.ts +7 -2
package/dist/lib/server/routes/claudeProxyRoutes.js +1737 -508
package/dist/lib/services/server/ai/observability/instrumentation.d.ts +7 -1
package/dist/lib/services/server/ai/observability/instrumentation.js +240 -40
package/dist/lib/tasks/backends/bullmqBackend.d.ts +33 -0
package/dist/lib/tasks/backends/bullmqBackend.js +196 -0
package/dist/lib/tasks/backends/nodeTimeoutBackend.d.ts +27 -0
package/dist/lib/tasks/backends/nodeTimeoutBackend.js +141 -0
package/dist/lib/tasks/backends/taskBackendRegistry.d.ts +31 -0
package/dist/lib/tasks/backends/taskBackendRegistry.js +66 -0
package/dist/lib/tasks/errors.d.ts +31 -0
package/dist/lib/tasks/errors.js +18 -0
package/dist/lib/tasks/store/fileTaskStore.d.ts +43 -0
package/dist/lib/tasks/store/fileTaskStore.js +179 -0
package/dist/lib/tasks/store/redisTaskStore.d.ts +43 -0
package/dist/lib/tasks/store/redisTaskStore.js +197 -0
package/dist/lib/tasks/taskExecutor.d.ts +21 -0
package/dist/lib/tasks/taskExecutor.js +166 -0
package/dist/lib/tasks/taskManager.d.ts +63 -0
package/dist/lib/tasks/taskManager.js +426 -0
package/dist/lib/tasks/tools/taskTools.d.ts +135 -0
package/dist/lib/tasks/tools/taskTools.js +274 -0
package/dist/lib/telemetry/index.d.ts +2 -1
package/dist/lib/telemetry/index.js +2 -1
package/dist/lib/telemetry/telemetryService.d.ts +3 -0
package/dist/lib/telemetry/telemetryService.js +65 -5
package/dist/lib/types/cli.d.ts +10 -0
package/dist/lib/types/configTypes.d.ts +3 -0
package/dist/lib/types/generateTypes.d.ts +13 -0
package/dist/lib/types/index.d.ts +1 -0
package/dist/lib/types/proxyTypes.d.ts +37 -5
package/dist/lib/types/streamTypes.d.ts +25 -3
package/dist/lib/types/taskTypes.d.ts +275 -0
package/dist/lib/types/taskTypes.js +37 -0
package/dist/lib/utils/messageBuilder.js +3 -2
package/dist/lib/utils/providerHealth.d.ts +18 -0
package/dist/lib/utils/providerHealth.js +240 -9
package/dist/lib/utils/providerUtils.js +14 -8
package/dist/lib/utils/toolChoice.d.ts +4 -0
package/dist/lib/utils/toolChoice.js +7 -0
package/dist/neurolink.d.ts +18 -1
package/dist/neurolink.js +367 -484
package/dist/observability/otelBridge.d.ts +2 -2
package/dist/observability/otelBridge.js +12 -3
package/dist/providers/amazonBedrock.js +2 -4
package/dist/providers/anthropic.d.ts +9 -5
package/dist/providers/anthropic.js +19 -14
package/dist/providers/anthropicBaseProvider.d.ts +3 -3
package/dist/providers/anthropicBaseProvider.js +5 -4
package/dist/providers/azureOpenai.d.ts +1 -1
package/dist/providers/azureOpenai.js +5 -4
package/dist/providers/googleAiStudio.js +30 -1
package/dist/providers/googleVertex.js +28 -6
package/dist/providers/huggingFace.d.ts +3 -3
package/dist/providers/huggingFace.js +6 -7
package/dist/providers/litellm.js +41 -29
package/dist/providers/mistral.js +2 -1
package/dist/providers/ollama.js +80 -23
package/dist/providers/openAI.js +3 -2
package/dist/providers/openRouter.js +2 -1
package/dist/providers/openaiCompatible.d.ts +4 -4
package/dist/providers/openaiCompatible.js +4 -3
package/dist/proxy/claudeFormat.d.ts +3 -2
package/dist/proxy/claudeFormat.js +25 -20
package/dist/proxy/cloaking/plugins/sessionIdentity.d.ts +2 -6
package/dist/proxy/cloaking/plugins/sessionIdentity.js +9 -33
package/dist/proxy/modelRouter.js +3 -0
package/dist/proxy/oauthFetch.d.ts +1 -1
package/dist/proxy/oauthFetch.js +65 -72
package/dist/proxy/proxyConfig.js +44 -24
package/dist/proxy/proxyEnv.d.ts +19 -0
package/dist/proxy/proxyEnv.js +72 -0
package/dist/proxy/proxyFetch.js +50 -4
package/dist/proxy/proxyTracer.d.ts +133 -0
package/dist/proxy/proxyTracer.js +644 -0
package/dist/proxy/rawStreamCapture.d.ts +10 -0
package/dist/proxy/rawStreamCapture.js +82 -0
package/dist/proxy/requestLogger.d.ts +32 -5
package/dist/proxy/requestLogger.js +406 -37
package/dist/proxy/sseInterceptor.d.ts +97 -0
package/dist/proxy/sseInterceptor.js +401 -0
package/dist/proxy/usageStats.d.ts +4 -3
package/dist/proxy/usageStats.js +25 -12
package/dist/rag/chunkers/MarkdownChunker.js +13 -5
package/dist/rag/chunking/markdownChunker.js +15 -6
package/dist/server/routes/claudeProxyRoutes.d.ts +7 -2
package/dist/server/routes/claudeProxyRoutes.js +1737 -508
package/dist/services/server/ai/observability/instrumentation.d.ts +7 -1
package/dist/services/server/ai/observability/instrumentation.js +240 -40
package/dist/tasks/backends/bullmqBackend.d.ts +33 -0
package/dist/tasks/backends/bullmqBackend.js +195 -0
package/dist/tasks/backends/nodeTimeoutBackend.d.ts +27 -0
package/dist/tasks/backends/nodeTimeoutBackend.js +140 -0
package/dist/tasks/backends/taskBackendRegistry.d.ts +31 -0
package/dist/tasks/backends/taskBackendRegistry.js +65 -0
package/dist/tasks/errors.d.ts +31 -0
package/dist/tasks/errors.js +17 -0
package/dist/tasks/store/fileTaskStore.d.ts +43 -0
package/dist/tasks/store/fileTaskStore.js +178 -0
package/dist/tasks/store/redisTaskStore.d.ts +43 -0
package/dist/tasks/store/redisTaskStore.js +196 -0
package/dist/tasks/taskExecutor.d.ts +21 -0
package/dist/tasks/taskExecutor.js +165 -0
package/dist/tasks/taskManager.d.ts +63 -0
package/dist/tasks/taskManager.js +425 -0
package/dist/tasks/tools/taskTools.d.ts +135 -0
package/dist/tasks/tools/taskTools.js +273 -0
package/dist/telemetry/index.d.ts +2 -1
package/dist/telemetry/index.js +2 -1
package/dist/telemetry/telemetryService.d.ts +3 -0
package/dist/telemetry/telemetryService.js +65 -5
package/dist/types/cli.d.ts +10 -0
package/dist/types/configTypes.d.ts +3 -0
package/dist/types/generateTypes.d.ts +13 -0
package/dist/types/index.d.ts +1 -0
package/dist/types/proxyTypes.d.ts +37 -5
package/dist/types/streamTypes.d.ts +25 -3
package/dist/types/taskTypes.d.ts +275 -0
package/dist/types/taskTypes.js +36 -0
package/dist/utils/messageBuilder.js +3 -2
package/dist/utils/providerHealth.d.ts +18 -0
package/dist/utils/providerHealth.js +240 -9
package/dist/utils/providerUtils.js +14 -8
package/dist/utils/toolChoice.d.ts +4 -0
package/dist/utils/toolChoice.js +6 -0
package/docs/assets/dashboards/neurolink-proxy-observability-dashboard.json +6609 -0
package/docs/changelog.md +252 -0
package/package.json +19 -1
package/scripts/observability/check-proxy-telemetry.mjs +235 -0
package/scripts/observability/docker-compose.proxy-observability.yaml +55 -0
package/scripts/observability/import-openobserve-dashboard.mjs +240 -0
package/scripts/observability/manage-local-openobserve.sh +184 -0
package/scripts/observability/otel-collector.proxy-observability.yaml +78 -0
package/scripts/observability/proxy-observability.env.example +23 -0

package/dist/server/routes/claudeProxyRoutes.js CHANGED Viewed

@@ -1,3 +1,4 @@
+/* eslint-disable max-depth */
 /**
  * Claude-Compatible Proxy Routes
  *
@@ -9,20 +10,23 @@
  * provider/model pairs (e.g. "claude-sonnet-4-20250514" -> vertex/gemini-2.5-pro).
  * Without a router, models are passed through to the Anthropic provider.
  */
-import { readFile, access } from "node:fs/promises";
-import { join } from "node:path";
+import { access, mkdir, readFile, rename, writeFile } from "node:fs/promises";
 import { homedir } from "node:os";
-import { parseClaudeRequest, serializeClaudeResponse, ClaudeStreamSerializer, buildClaudeError, generateToolUseId, } from "../../proxy/claudeFormat.js";
+import { join } from "node:path";
+import { buildStableClaudeCodeBillingHeader, CLAUDE_CLI_USER_AGENT, CLAUDE_CODE_OAUTH_BETAS, getOrCreateClaudeCodeIdentity, parseClaudeCodeUserId, } from "../../auth/anthropicOAuth.js";
+import { parseQuotaHeaders, saveAccountQuota } from "../../proxy/accountQuota.js";
+import { buildClaudeError, ClaudeStreamSerializer, generateToolUseId, parseClaudeRequest, serializeClaudeResponse, } from "../../proxy/claudeFormat.js";
+import { ProxyTracer } from "../../proxy/proxyTracer.js";
+import { createRawStreamCapture } from "../../proxy/rawStreamCapture.js";
+import { logBodyCapture, logRequest, logRequestAttempt, logStreamError } from "../../proxy/requestLogger.js";
+import { createSSEInterceptor } from "../../proxy/sseInterceptor.js";
+import { needsRefresh, persistTokens, refreshToken } from "../../proxy/tokenRefresh.js";
+import { recordAttempt, recordAttemptError, recordCooldown, recordFinalError, recordFinalSuccess, } from "../../proxy/usageStats.js";
 import { logger } from "../../utils/logger.js";
-import { recordRequest, recordSuccess, recordError, recordCooldown, } from "../../proxy/usageStats.js";
-import { logRequest, logFullRequestResponse, logStreamError, } from "../../proxy/requestLogger.js";
-import { parseQuotaHeaders, saveAccountQuota, } from "../../proxy/accountQuota.js";
-import { needsRefresh, refreshToken, persistTokens, } from "../../proxy/tokenRefresh.js";
+import { ProviderHealthChecker } from "../../utils/providerHealth.js";
 // ---------------------------------------------------------------------------
 // Helpers
 // ---------------------------------------------------------------------------
-/** Header names whose values must be masked in debug logs. */
-const SENSITIVE_HEADERS = new Set(["authorization", "x-api-key"]);
 /** Headers that must never be forwarded upstream to Anthropic. */
 const BLOCKED_UPSTREAM_HEADERS = new Set([
     "cookie",
@@ -32,22 +36,6 @@ const BLOCKED_UPSTREAM_HEADERS = new Set([
     "content-length",
     "transfer-encoding",
 ]);
-/** Return a shallow copy of `headers` with sensitive values redacted. */
-function redactSensitiveHeaders(headers) {
-    const redacted = {};
-    for (const [key, value] of Object.entries(headers)) {
-        if (SENSITIVE_HEADERS.has(key.toLowerCase()) && value.length > 8) {
-            redacted[key] = value.substring(0, 8) + "...";
-        }
-        else if (SENSITIVE_HEADERS.has(key.toLowerCase())) {
-            redacted[key] = "***";
-        }
-        else {
-            redacted[key] = value;
-        }
-    }
-    return redacted;
-}
 // ---------------------------------------------------------------------------
 // Module-level state
 // ---------------------------------------------------------------------------
@@ -83,65 +71,192 @@ function advancePrimaryIfCurrent(accountKey, enabledCount, primaryAccountKey) {
     }
     primaryAccountIndex = (primaryAccountIndex + 1) % enabledCount;
 }
-// ---------------------------------------------------------------------------
-// OAuth polyfill helpers (extracted to reduce block nesting)
-// ---------------------------------------------------------------------------
 const snapshotCache = new Map();
 const SNAPSHOT_CACHE_TTL_MS = 5 * 60 * 1000; // 5 minutes
-/**
- * Load a header snapshot captured from a real Claude Code session and apply
- * any headers the client didn't send.  This makes non-Claude-Code requests
- * (e.g. from Curator, custom apps) appear identical to Claude Code.
- */
-async function applyHeaderSnapshot(headers, accountLabel) {
+const SNAPSHOT_STABLE_HEADERS = new Set([
+    "accept",
+    "accept-encoding",
+    "accept-language",
+    "anthropic-beta",
+    "anthropic-dangerous-direct-browser-access",
+    "anthropic-version",
+    "sec-fetch-mode",
+    "user-agent",
+    "x-app",
+    "x-stainless-arch",
+    "x-stainless-lang",
+    "x-stainless-os",
+    "x-stainless-package-version",
+    "x-stainless-retry-count",
+    "x-stainless-runtime",
+    "x-stainless-runtime-version",
+    "x-stainless-timeout",
+    "x-subscription-tier",
+]);
+const NON_CLAUDE_OAUTH_BETAS = [
+    "oauth-2025-04-20",
+    "claude-code-20250219",
+    "fine-grained-tool-streaming-2025-05-14",
+];
+function getSnapshotSafeLabel(accountLabel) {
+    return accountLabel.replace(/[^a-zA-Z0-9._@-]/g, "_");
+}
+function getSnapshotPath(accountLabel) {
+    return join(homedir(), ".neurolink", "header-snapshots", `anthropic_${getSnapshotSafeLabel(accountLabel)}.json`);
+}
+function applySnapshotHeaders(headers, snapshot) {
+    if (!snapshot?.headers) {
+        return;
+    }
+    for (const [sk, sv] of Object.entries(snapshot.headers)) {
+        const lower = sk.toLowerCase();
+        if (typeof sv === "string" &&
+            !headers[lower] &&
+            !BLOCKED_UPSTREAM_HEADERS.has(lower) &&
+            lower !== "authorization" &&
+            lower !== "x-api-key" &&
+            lower !== "x-claude-code-session-id") {
+            headers[lower] = sv;
+        }
+    }
+}
+async function loadClaudeSnapshot(accountLabel) {
     try {
-        // Sanitize accountLabel to prevent directory traversal
-        const safeLabel = accountLabel.replace(/[^a-zA-Z0-9._@-]/g, "_");
-        // Check cache first
+        const safeLabel = getSnapshotSafeLabel(accountLabel);
         const cached = snapshotCache.get(safeLabel);
         if (cached && Date.now() - cached.loadedAt < SNAPSHOT_CACHE_TTL_MS) {
-            for (const [sk, sv] of Object.entries(cached.headers)) {
-                const lower = sk.toLowerCase();
-                if (typeof sv === "string" &&
-                    !headers[lower] &&
-                    !BLOCKED_UPSTREAM_HEADERS.has(lower) &&
-                    lower !== "authorization" &&
-                    lower !== "x-api-key") {
-                    headers[lower] = sv;
-                }
-            }
-            return;
+            return cached.snapshot;
         }
-        const snapshotPath = join(homedir(), ".neurolink", "header-snapshots", `anthropic_${safeLabel}.json`);
+        const snapshotPath = getSnapshotPath(accountLabel);
         try {
             await access(snapshotPath);
         }
         catch {
-            return;
+            return null;
         }
         const snapshot = JSON.parse(await readFile(snapshotPath, "utf8"));
-        if (!snapshot.headers) {
-            return;
+        if (!snapshot || typeof snapshot !== "object") {
+            return null;
+        }
+        const normalized = {
+            accountKey: "accountKey" in snapshot && typeof snapshot.accountKey === "string"
+                ? snapshot.accountKey
+                : `anthropic:${accountLabel}`,
+            capturedAt: "capturedAt" in snapshot && typeof snapshot.capturedAt === "string"
+                ? snapshot.capturedAt
+                : new Date(0).toISOString(),
+            source: "claude-code",
+            headers: "headers" in snapshot && snapshot.headers ? snapshot.headers : {},
+            ...(snapshot.body ? { body: snapshot.body } : {}),
+        };
+        if (Object.keys(normalized.headers).length === 0 && Object.keys(normalized.body ?? {}).length === 0) {
+            return null;
         }
-        // Store in cache
         snapshotCache.set(safeLabel, {
-            headers: snapshot.headers,
+            snapshot: normalized,
             loadedAt: Date.now(),
         });
-        for (const [sk, sv] of Object.entries(snapshot.headers)) {
-            const lower = sk.toLowerCase();
-            if (typeof sv === "string" &&
-                !headers[lower] &&
-                !BLOCKED_UPSTREAM_HEADERS.has(lower) &&
-                lower !== "authorization" &&
-                lower !== "x-api-key") {
-                headers[lower] = sv;
-            }
+        return normalized;
+    }
+    catch {
+        return null;
+    }
+}
+function buildSnapshotHeaders(headers, existingHeaders) {
+    const merged = { ...(existingHeaders ?? {}) };
+    for (const [key, value] of Object.entries(headers)) {
+        const lower = key.toLowerCase();
+        if (typeof value === "string" &&
+            SNAPSHOT_STABLE_HEADERS.has(lower) &&
+            !BLOCKED_UPSTREAM_HEADERS.has(lower) &&
+            lower !== "authorization" &&
+            lower !== "x-api-key" &&
+            lower !== "x-claude-code-session-id") {
+            merged[lower] = value;
         }
     }
+    return merged;
+}
+function extractSnapshotBody(body) {
+    if (!body || typeof body !== "object") {
+        return undefined;
+    }
+    const parsed = body;
+    const identity = parseClaudeCodeUserId(parsed.metadata?.user_id);
+    const systemBlocks = Array.isArray(parsed.system)
+        ? parsed.system
+        : typeof parsed.system === "string"
+            ? [{ type: "text", text: parsed.system }]
+            : [];
+    const billingHeader = systemBlocks.find((block) => typeof block?.text === "string" && block.text.includes("x-anthropic-billing-header"))?.text;
+    const agentBlock = systemBlocks.find((block) => typeof block?.text === "string" && block.text.includes("Claude Agent SDK"))?.text;
+    if (!identity && !billingHeader && !agentBlock) {
+        return undefined;
+    }
+    return {
+        ...(identity ? { metadataUserId: identity.metadataUserId } : {}),
+        ...(identity ? { sessionId: identity.sessionId } : {}),
+        ...(billingHeader ? { billingHeader } : {}),
+        ...(agentBlock ? { agentBlock } : {}),
+    };
+}
+function isLikelyClaudeClient(headers, snapshotBody) {
+    return (typeof headers["x-claude-code-session-id"] === "string" ||
+        headers["user-agent"]?.startsWith("claude-cli/") ||
+        !!snapshotBody?.metadataUserId ||
+        !!snapshotBody?.billingHeader ||
+        !!snapshotBody?.agentBlock);
+}
+function snapshotsMatch(existing, next) {
+    if (!existing) {
+        return false;
+    }
+    return (JSON.stringify(existing.headers ?? {}) === JSON.stringify(next.headers ?? {}) &&
+        JSON.stringify(existing.body ?? {}) === JSON.stringify(next.body ?? {}));
+}
+async function persistClaudeSnapshot(accountLabel, snapshot) {
+    const snapshotPath = getSnapshotPath(accountLabel);
+    const dirPath = join(homedir(), ".neurolink", "header-snapshots");
+    await mkdir(dirPath, { recursive: true });
+    const tmpPath = `${snapshotPath}.tmp`;
+    await writeFile(tmpPath, JSON.stringify(snapshot, null, 2), { mode: 0o600 });
+    await rename(tmpPath, snapshotPath);
+    snapshotCache.set(getSnapshotSafeLabel(accountLabel), {
+        snapshot,
+        loadedAt: Date.now(),
+    });
+}
+async function maybeRefreshClaudeSnapshot(accountLabel, accountKey, headers, bodyStr) {
+    const existing = await loadClaudeSnapshot(accountLabel);
+    let parsedBody;
+    try {
+        parsedBody = JSON.parse(bodyStr);
+    }
     catch {
-        // Snapshot missing or corrupt — continue without it
+        return existing;
+    }
+    const body = extractSnapshotBody(parsedBody);
+    if (!isLikelyClaudeClient(headers, body)) {
+        return existing;
+    }
+    const next = {
+        accountKey,
+        capturedAt: new Date().toISOString(),
+        source: "claude-code",
+        headers: buildSnapshotHeaders(headers, existing?.headers),
+        body: {
+            ...(existing?.body ?? {}),
+            ...(body ?? {}),
+            ...(typeof headers["x-claude-code-session-id"] === "string"
+                ? { sessionId: headers["x-claude-code-session-id"] }
+                : {}),
+        },
+    };
+    if (snapshotsMatch(existing, next)) {
+        return existing;
     }
+    await persistClaudeSnapshot(accountLabel, next);
+    return next;
 }
 /**
  * Polyfill the request body for OAuth accounts.
@@ -149,59 +264,74 @@ async function applyHeaderSnapshot(headers, accountLabel) {
  * into the body.  Non-CC clients (Curator, custom apps) don't send these —
  * Anthropic rejects without them.
  */
-function polyfillOAuthBody(bodyStr, accountToken) {
+function polyfillOAuthBody(bodyStr, accountToken, snapshot, preferredSessionId) {
     try {
         const parsed = JSON.parse(bodyStr);
         // Billing header block (required by Anthropic for OAuth)
-        const randomHex = Math.random().toString(16).substring(2, 5);
-        const billingBlock = {
-            type: "text",
-            text: `x-anthropic-billing-header: cc_version=2.1.86.${randomHex}; cc_entrypoint=cli; cch=proxy;`,
-        };
+        // NOTE: This block MUST be deterministic (no random values) to preserve
+        // Anthropic's prompt caching prefix chain. We keep the real Claude Code
+        // version/entrypoint shape when present, but stabilize the volatile cch.
         const agentBlock = {
             type: "text",
-            text: "You are a Claude agent, built on Anthropic's Claude Agent SDK.",
+            text: snapshot?.body?.agentBlock || "You are a Claude agent, built on Anthropic's Claude Agent SDK.",
         };
-        // Normalise system to array and prepend billing + agent
+        // Normalise system to array and APPEND billing + agent blocks.
+        // IMPORTANT: We append (not prepend) to preserve the client's cache
+        // prefix chain. Anthropic's prompt caching uses prefix matching — if we
+        // insert anything before the client's system blocks, we invalidate all
+        // cached content (tools, system prompt, message history).
+        //
+        // Claude Code sends a billing block with a `cch=<hash>` value that changes
+        // on every request. We fix this by:
+        //   1. Removing the client's billing block from its current position
+        //   2. Stabilizing it while keeping the official Claude Code shape
+        //   3. Appending it at the END so the cacheable system blocks stay
+        //      at the front of the prefix chain
         if (parsed.system) {
             if (typeof parsed.system === "string") {
                 parsed.system = [{ type: "text", text: parsed.system }];
             }
             if (Array.isArray(parsed.system)) {
-                const hasBilling = parsed.system.some((b) => typeof b.text === "string" &&
-                    b.text.includes("x-anthropic-billing-header"));
-                const hasAgent = parsed.system.some((b) => typeof b.text === "string" && b.text.includes("Claude Agent SDK"));
-                const toInsert = [];
-                if (!hasBilling) {
-                    toInsert.push(billingBlock);
-                }
-                if (!hasAgent) {
-                    toInsert.push(agentBlock);
-                }
-                if (toInsert.length > 0) {
-                    parsed.system = [...toInsert, ...parsed.system];
+                // Find and remove existing billing/agent blocks from wherever
+                // the client placed them (typically at system[0])
+                const billingIdx = parsed.system.findIndex((b) => typeof b.text === "string" && b.text.includes("x-anthropic-billing-header"));
+                const agentIdx = parsed.system.findIndex((b) => typeof b.text === "string" && b.text.includes("Claude Agent SDK"));
+                const billingBlock = {
+                    type: "text",
+                    text: buildStableClaudeCodeBillingHeader(parsed.system[billingIdx]?.text ?? snapshot?.body?.billingHeader),
+                };
+                // Remove in reverse index order so indices stay valid
+                const indicesToRemove = [billingIdx, agentIdx].filter((i) => i >= 0).sort((a, b) => b - a);
+                for (const idx of indicesToRemove) {
+                    parsed.system.splice(idx, 1);
                 }
+                // Always append a deterministic billing block at the end.
+                // If the client sent one, we stripped its dynamic cch= and use
+                // our stable version instead. If not, we add ours.
+                parsed.system = [...parsed.system, billingBlock, agentBlock];
             }
         }
         else {
-            parsed.system = [billingBlock, agentBlock];
-        }
-        // Inject metadata.user_id (required for OAuth)
-        if (!parsed.metadata?.user_id) {
-            const tokenPrefix = accountToken.substring(0, Math.min(20, accountToken.length));
-            const hash = Array.from(new TextEncoder().encode(tokenPrefix))
-                .reduce((a, b) => ((a << 5) - a + b) | 0, 0)
-                .toString(16)
-                .replace("-", "");
-            parsed.metadata = {
-                ...parsed.metadata,
-                user_id: `proxy-${hash}`,
+            const billingBlock = {
+                type: "text",
+                text: buildStableClaudeCodeBillingHeader(snapshot?.body?.billingHeader),
             };
+            parsed.system = [billingBlock, agentBlock];
         }
-        return JSON.stringify(parsed);
+        // Inject Claude-Code-shaped metadata.user_id (required for OAuth).
+        const tokenPrefix = accountToken.substring(0, Math.min(20, accountToken.length));
+        const identity = getOrCreateClaudeCodeIdentity(tokenPrefix, {
+            existingUserId: parsed.metadata?.user_id ?? snapshot?.body?.metadataUserId,
+            preferredSessionId: preferredSessionId ?? snapshot?.body?.sessionId,
+        });
+        parsed.metadata = {
+            ...parsed.metadata,
+            user_id: identity.metadataUserId,
+        };
+        return { bodyStr: JSON.stringify(parsed), sessionId: identity.sessionId };
     }
     catch {
-        return bodyStr; // JSON parse failed — use original body
+        return { bodyStr }; // JSON parse failed — use original body
     }
 }
 // ---------------------------------------------------------------------------
@@ -269,7 +399,8 @@ async function tryLoadLegacyAccount(creds, legacyCredPath) {
  * @param basePath    - Base path prefix (default: "" since Claude API uses /v1/...).
  * @returns RouteGroup with Claude-compatible endpoints.
  */
-export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrategy = "fill-first") {
+// eslint-disable-next-line max-lines-per-function
+export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrategy = "fill-first", passthroughMode = false) {
     return {
         prefix: `${basePath}/v1`,
         routes: [
@@ -282,8 +413,7 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                 handler: async (ctx) => {
                     const body = ctx.body;
                     // 1. Validate
-                    if (typeof body?.model !== "string" ||
-                        !Array.isArray(body?.messages)) {
+                    if (typeof body?.model !== "string" || !Array.isArray(body?.messages)) {
                         return buildClaudeError(400, "Missing required fields: model, messages");
                     }
                     // 2. Resolve model via router (or pass through to anthropic)
@@ -298,15 +428,476 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                         provider: "anthropic",
                         model: body.model,
                     };
+                    const clientRequestBody = JSON.stringify(body);
+                    // ── OTel tracing ──────────────────────────────────────
+                    let tracer;
+                    try {
+                        tracer = ProxyTracer.startRequest({
+                            requestId: ctx.requestId,
+                            method: ctx.method,
+                            path: ctx.path,
+                            model: body.model,
+                            stream: body.stream ?? false,
+                            toolCount: Array.isArray(body.tools) ? body.tools.length : 0,
+                            sessionId: ctx.headers["x-neurolink-session-id"] ?? ctx.headers["x-claude-code-session-id"] ?? undefined,
+                            userAgent: ctx.headers["user-agent"] ?? undefined,
+                        }, ctx.headers);
+                        const receiveSpan = tracer.startReceive();
+                        tracer.logRequestHeaders(ctx.headers);
+                        tracer.logRequestBody(clientRequestBody);
+                        receiveSpan.end();
+                    }
+                    catch {
+                        // Graceful degradation — continue without tracing
+                        tracer = undefined;
+                    }
+                    const requestStartTime = Date.now();
+                    const logProxyBody = (capture) => {
+                        const traceCtx = tracer?.getTraceContext();
+                        void logBodyCapture({
+                            timestamp: new Date().toISOString(),
+                            requestId: ctx.requestId,
+                            model: body.model,
+                            stream: body.stream ?? false,
+                            ...capture,
+                            ...(traceCtx ? { traceId: traceCtx.traceId, spanId: traceCtx.spanId } : {}),
+                        });
+                    };
+                    const logFinalRequest = (status, accountLabel, accountType, errorType, errorMessage, extra) => {
+                        const traceCtx = tracer?.getTraceContext();
+                        logRequest({
+                            timestamp: new Date().toISOString(),
+                            requestId: ctx.requestId,
+                            method: ctx.method,
+                            path: ctx.path,
+                            model: body.model,
+                            stream: !!body.stream,
+                            toolCount: Array.isArray(body.tools) ? body.tools.length : 0,
+                            account: accountLabel,
+                            accountType,
+                            responseStatus: status,
+                            responseTimeMs: Date.now() - requestStartTime,
+                            ...(errorType ? { errorType } : {}),
+                            ...(errorMessage ? { errorMessage } : {}),
+                            ...(extra?.inputTokens !== undefined ? { inputTokens: extra.inputTokens } : {}),
+                            ...(extra?.outputTokens !== undefined ? { outputTokens: extra.outputTokens } : {}),
+                            ...(extra?.cacheCreationTokens !== undefined ? { cacheCreationTokens: extra.cacheCreationTokens } : {}),
+                            ...(extra?.cacheReadTokens !== undefined ? { cacheReadTokens: extra.cacheReadTokens } : {}),
+                            ...(traceCtx ? { traceId: traceCtx.traceId, spanId: traceCtx.spanId } : {}),
+                        });
+                    };
+                    logProxyBody({
+                        phase: "client_request",
+                        headers: ctx.headers,
+                        body: clientRequestBody,
+                        bodySize: Buffer.byteLength(clientRequestBody, "utf8"),
+                        contentType: ctx.headers["content-type"] ?? "application/json",
+                    });
+                    const buildLoggedClaudeError = (status, message, errorType, extra) => {
+                        const errorBody = buildClaudeError(status, message, errorType);
+                        const errorBodyText = JSON.stringify(errorBody);
+                        recordFinalError(status, extra?.account, extra?.accountType);
+                        logFinalRequest(status, extra?.account ?? "", extra?.accountType ?? "final", errorType, message);
+                        logProxyBody({
+                            phase: "client_response",
+                            headers: { "content-type": "application/json" },
+                            body: errorBodyText,
+                            bodySize: Buffer.byteLength(errorBodyText, "utf8"),
+                            contentType: "application/json",
+                            responseStatus: status,
+                            durationMs: Date.now() - requestStartTime,
+                            ...extra,
+                        });
+                        return errorBody;
+                    };
                     try {
                         // 3. Route based on target provider
                         if (route.provider === null) {
-                            return buildClaudeError(404, `Model '${body.model}' is not a Claude model. ` +
-                                `Use a model router to route it to another provider.`);
+                            tracer?.setError("not_found_error", `Model '${body.model}' is not a Claude model.`);
+                            tracer?.end(404, Date.now() - requestStartTime);
+                            return buildLoggedClaudeError(404, `Model '${body.model}' is not a Claude model. ` + `Use a model router to route it to another provider.`);
                         }
                         const isClaudeTarget = route.provider === "anthropic";
                         if (isClaudeTarget) {
-                            // ─── PASSTHROUGH MODE (Claude → Claude) ───────────────
+                            // --- PASSTHROUGH MODE (Claude -> Claude) -------------------
+                            tracer?.setMode("passthrough");
+                            // ── CLI --passthrough: raw transparent forwarding ──────
+                            if (passthroughMode) {
+                                tracer?.setMode("passthrough-cli");
+                                const bodyStr = clientRequestBody;
+                                const toolCount = Array.isArray(body.tools) ? body.tools.length : 0;
+                                // Forward client headers as-is, filtering blocked ones
+                                const upstreamHeaders = {};
+                                for (const [key, value] of Object.entries(ctx.headers)) {
+                                    if (!BLOCKED_UPSTREAM_HEADERS.has(key.toLowerCase()) && value) {
+                                        upstreamHeaders[key] = value;
+                                    }
+                                }
+                                // Ensure content-type is set
+                                if (!upstreamHeaders["content-type"]) {
+                                    upstreamHeaders["content-type"] = "application/json";
+                                }
+                                const upstreamSpan = tracer?.startUpstreamAttempt({
+                                    account: "passthrough",
+                                    attempt: 1,
+                                    polyfillHeaders: false,
+                                    polyfillBody: false,
+                                    upstreamUrl: "https://api.anthropic.com/v1/messages?beta=true",
+                                });
+                                tracer?.logUpstreamRequestHeaders(upstreamHeaders);
+                                tracer?.logUpstreamRequestBody(bodyStr);
+                                logProxyBody({
+                                    phase: "upstream_request",
+                                    headers: upstreamHeaders,
+                                    body: bodyStr,
+                                    bodySize: Buffer.byteLength(bodyStr, "utf8"),
+                                    contentType: upstreamHeaders["content-type"] ?? "application/json",
+                                    account: "passthrough",
+                                    accountType: "passthrough",
+                                    attempt: 1,
+                                });
+                                let response;
+                                try {
+                                    response = await fetch("https://api.anthropic.com/v1/messages?beta=true", {
+                                        method: "POST",
+                                        headers: upstreamHeaders,
+                                        body: bodyStr,
+                                        signal: AbortSignal.timeout(UPSTREAM_FETCH_TIMEOUT_MS),
+                                    });
+                                }
+                                catch (fetchErr) {
+                                    const errMsg = fetchErr instanceof Error ? fetchErr.message : String(fetchErr);
+                                    tracer?.setError("network_error", errMsg);
+                                    upstreamSpan?.end();
+                                    tracer?.end(502, Date.now() - requestStartTime);
+                                    logRequest({
+                                        timestamp: new Date().toISOString(),
+                                        requestId: ctx.requestId,
+                                        method: ctx.method,
+                                        path: ctx.path,
+                                        model: body.model,
+                                        stream: body.stream ?? false,
+                                        toolCount,
+                                        account: "passthrough",
+                                        accountType: "passthrough",
+                                        responseStatus: 502,
+                                        responseTimeMs: Date.now() - requestStartTime,
+                                        errorType: "network_error",
+                                        errorMessage: errMsg,
+                                    });
+                                    const errorBody = buildClaudeError(502, `Passthrough fetch failed: ${errMsg}`);
+                                    logProxyBody({
+                                        phase: "client_response",
+                                        headers: { "content-type": "application/json" },
+                                        body: JSON.stringify(errorBody),
+                                        bodySize: Buffer.byteLength(JSON.stringify(errorBody), "utf8"),
+                                        contentType: "application/json",
+                                        account: "passthrough",
+                                        accountType: "passthrough",
+                                        attempt: 1,
+                                        responseStatus: 502,
+                                        durationMs: Date.now() - requestStartTime,
+                                    });
+                                    return errorBody;
+                                }
+                                const upstreamResponseHeaders = {};
+                                response.headers.forEach((v, k) => {
+                                    upstreamResponseHeaders[k] = v;
+                                });
+                                tracer?.logUpstreamResponseHeaders(upstreamResponseHeaders);
+                                if (!response.ok) {
+                                    const errorText = await response.text();
+                                    tracer?.logUpstreamResponseBody(errorText);
+                                    logProxyBody({
+                                        phase: "upstream_response",
+                                        headers: upstreamResponseHeaders,
+                                        body: errorText,
+                                        bodySize: Buffer.byteLength(errorText, "utf8"),
+                                        contentType: upstreamResponseHeaders["content-type"] ?? "application/json",
+                                        account: "passthrough",
+                                        accountType: "passthrough",
+                                        attempt: 1,
+                                        responseStatus: response.status,
+                                        durationMs: Date.now() - requestStartTime,
+                                    });
+                                    logProxyBody({
+                                        phase: "client_response",
+                                        headers: upstreamResponseHeaders,
+                                        body: errorText,
+                                        bodySize: Buffer.byteLength(errorText, "utf8"),
+                                        contentType: upstreamResponseHeaders["content-type"] ?? "application/json",
+                                        account: "passthrough",
+                                        accountType: "passthrough",
+                                        attempt: 1,
+                                        responseStatus: response.status,
+                                        durationMs: Date.now() - requestStartTime,
+                                    });
+                                    upstreamSpan?.end();
+                                    tracer?.setError("api_error", errorText.slice(0, 500));
+                                    tracer?.end(response.status, Date.now() - requestStartTime);
+                                    try {
+                                        return JSON.parse(errorText);
+                                    }
+                                    catch {
+                                        return buildClaudeError(response.status, errorText);
+                                    }
+                                }
+                                // Streaming response
+                                if (body.stream && response.body) {
+                                    const responseHeaders = { ...upstreamResponseHeaders };
+                                    const { stream: clientCaptureStream, capture: clientCapture } = createRawStreamCapture();
+                                    let streamSource = response.body;
+                                    if (tracer) {
+                                        try {
+                                            const { stream: interceptor, telemetry } = createSSEInterceptor({ captureRawText: true });
+                                            streamSource = streamSource.pipeThrough(interceptor);
+                                            const capturedTracer = tracer;
+                                            const capturedUpstreamSpan = upstreamSpan;
+                                            const capturedResponse = response;
+                                            const capturedRequestBytes = bodyStr.length;
+                                            Promise.all([telemetry, clientCapture])
+                                                .then(([data, clientBody]) => {
+                                                capturedTracer.setUsage({
+                                                    inputTokens: data.usage.inputTokens,
+                                                    outputTokens: data.usage.outputTokens,
+                                                    cacheCreationTokens: data.usage.cacheCreationInputTokens,
+                                                    cacheReadTokens: data.usage.cacheReadInputTokens,
+                                                });
+                                                capturedTracer.logStreamEvents(data.events);
+                                                const rateLimit5h = parseFloat(capturedResponse.headers.get("anthropic-ratelimit-unified-5h-utilization") ?? "");
+                                                const rateLimit7d = parseFloat(capturedResponse.headers.get("anthropic-ratelimit-unified-7d-utilization") ?? "");
+                                                const usageUpdate = {
+                                                    inputTokens: data.usage.inputTokens,
+                                                    outputTokens: data.usage.outputTokens,
+                                                    cacheCreationTokens: data.usage.cacheCreationInputTokens,
+                                                    cacheReadTokens: data.usage.cacheReadInputTokens,
+                                                };
+                                                if (!isNaN(rateLimit5h)) {
+                                                    usageUpdate.rateLimitAfter5h = rateLimit5h;
+                                                }
+                                                if (!isNaN(rateLimit7d)) {
+                                                    usageUpdate.rateLimitAfter7d = rateLimit7d;
+                                                }
+                                                if (!isNaN(rateLimit5h) || !isNaN(rateLimit7d)) {
+                                                    capturedTracer.setUsage(usageUpdate);
+                                                }
+                                                capturedTracer.logUpstreamResponseBody(data.rawText ?? "");
+                                                capturedTracer.recordMetrics();
+                                                capturedTracer.recordBodySizes(capturedRequestBytes, data.totalBytesReceived);
+                                                capturedUpstreamSpan?.end();
+                                                capturedTracer.end(200, Date.now() - requestStartTime);
+                                                const traceCtx = capturedTracer.getTraceContext();
+                                                logRequest({
+                                                    timestamp: new Date().toISOString(),
+                                                    requestId: ctx.requestId,
+                                                    method: ctx.method,
+                                                    path: ctx.path,
+                                                    model: body.model,
+                                                    stream: true,
+                                                    toolCount,
+                                                    account: "passthrough",
+                                                    accountType: "passthrough",
+                                                    responseStatus: 200,
+                                                    responseTimeMs: Date.now() - requestStartTime,
+                                                    inputTokens: data.usage.inputTokens,
+                                                    outputTokens: data.usage.outputTokens,
+                                                    cacheCreationTokens: data.usage.cacheCreationInputTokens,
+                                                    cacheReadTokens: data.usage.cacheReadInputTokens,
+                                                    traceId: traceCtx.traceId,
+                                                    spanId: traceCtx.spanId,
+                                                });
+                                                logProxyBody({
+                                                    phase: "upstream_response",
+                                                    headers: responseHeaders,
+                                                    body: data.rawText ?? "",
+                                                    bodySize: data.totalBytesReceived,
+                                                    contentType: responseHeaders["content-type"] ?? "text/event-stream",
+                                                    account: "passthrough",
+                                                    accountType: "passthrough",
+                                                    attempt: 1,
+                                                    responseStatus: 200,
+                                                    durationMs: Date.now() - requestStartTime,
+                                                });
+                                                logProxyBody({
+                                                    phase: "client_response",
+                                                    headers: responseHeaders,
+                                                    body: clientBody.text,
+                                                    bodySize: clientBody.totalBytes,
+                                                    contentType: responseHeaders["content-type"] ?? "text/event-stream",
+                                                    account: "passthrough",
+                                                    accountType: "passthrough",
+                                                    attempt: 1,
+                                                    responseStatus: 200,
+                                                    durationMs: Date.now() - requestStartTime,
+                                                });
+                                            })
+                                                .catch((err) => {
+                                                capturedTracer.setError("stream_error", err instanceof Error ? err.message : String(err));
+                                                capturedUpstreamSpan?.end();
+                                                capturedTracer.end(500, Date.now() - requestStartTime);
+                                                const traceCtx = capturedTracer.getTraceContext();
+                                                logRequest({
+                                                    timestamp: new Date().toISOString(),
+                                                    requestId: ctx.requestId,
+                                                    method: ctx.method,
+                                                    path: ctx.path,
+                                                    model: body.model,
+                                                    stream: true,
+                                                    toolCount,
+                                                    account: "passthrough",
+                                                    accountType: "passthrough",
+                                                    responseStatus: 500,
+                                                    responseTimeMs: Date.now() - requestStartTime,
+                                                    errorType: "stream_error",
+                                                    errorMessage: err instanceof Error ? err.message : String(err),
+                                                    traceId: traceCtx.traceId,
+                                                    spanId: traceCtx.spanId,
+                                                });
+                                            });
+                                        }
+                                        catch {
+                                            // Streaming capture is best-effort; request completion is handled elsewhere.
+                                        }
+                                    }
+                                    else {
+                                        clientCapture
+                                            .then((clientBody) => {
+                                            logProxyBody({
+                                                phase: "upstream_response",
+                                                headers: responseHeaders,
+                                                body: clientBody.text,
+                                                bodySize: clientBody.totalBytes,
+                                                contentType: responseHeaders["content-type"] ?? "text/event-stream",
+                                                account: "passthrough",
+                                                accountType: "passthrough",
+                                                attempt: 1,
+                                                responseStatus: 200,
+                                                durationMs: Date.now() - requestStartTime,
+                                            });
+                                            logProxyBody({
+                                                phase: "client_response",
+                                                headers: responseHeaders,
+                                                body: clientBody.text,
+                                                bodySize: clientBody.totalBytes,
+                                                contentType: responseHeaders["content-type"] ?? "text/event-stream",
+                                                account: "passthrough",
+                                                accountType: "passthrough",
+                                                attempt: 1,
+                                                responseStatus: 200,
+                                                durationMs: Date.now() - requestStartTime,
+                                            });
+                                        })
+                                            .catch(() => {
+                                            // Non-fatal
+                                        });
+                                    }
+                                    const clientStream = streamSource.pipeThrough(clientCaptureStream);
+                                    return new Response(clientStream, {
+                                        status: response.status,
+                                        headers: responseHeaders,
+                                    });
+                                }
+                                // Non-streaming response
+                                const responseText = await response.text();
+                                tracer?.logUpstreamResponseBody(responseText);
+                                logProxyBody({
+                                    phase: "upstream_response",
+                                    headers: upstreamResponseHeaders,
+                                    body: responseText,
+                                    bodySize: Buffer.byteLength(responseText, "utf8"),
+                                    contentType: upstreamResponseHeaders["content-type"] ?? "application/json",
+                                    account: "passthrough",
+                                    accountType: "passthrough",
+                                    attempt: 1,
+                                    responseStatus: response.status,
+                                    durationMs: Date.now() - requestStartTime,
+                                });
+                                logProxyBody({
+                                    phase: "client_response",
+                                    headers: upstreamResponseHeaders,
+                                    body: responseText,
+                                    bodySize: Buffer.byteLength(responseText, "utf8"),
+                                    contentType: upstreamResponseHeaders["content-type"] ?? "application/json",
+                                    account: "passthrough",
+                                    accountType: "passthrough",
+                                    attempt: 1,
+                                    responseStatus: response.status,
+                                    durationMs: Date.now() - requestStartTime,
+                                });
+                                const responseJson = JSON.parse(responseText);
+                                if (tracer && responseJson && typeof responseJson === "object") {
+                                    const usage = responseJson.usage;
+                                    if (usage) {
+                                        tracer.setUsage({
+                                            inputTokens: usage.input_tokens ?? 0,
+                                            outputTokens: usage.output_tokens ?? 0,
+                                            cacheCreationTokens: usage.cache_creation_input_tokens ?? 0,
+                                            cacheReadTokens: usage.cache_read_input_tokens ?? 0,
+                                        });
+                                        const rateLimit5h = parseFloat(response.headers.get("anthropic-ratelimit-unified-5h-utilization") ?? "");
+                                        const rateLimit7d = parseFloat(response.headers.get("anthropic-ratelimit-unified-7d-utilization") ?? "");
+                                        if (!isNaN(rateLimit5h) || !isNaN(rateLimit7d)) {
+                                            const usageWithRates = {
+                                                inputTokens: usage.input_tokens ?? 0,
+                                                outputTokens: usage.output_tokens ?? 0,
+                                                cacheCreationTokens: usage.cache_creation_input_tokens ?? 0,
+                                                cacheReadTokens: usage.cache_read_input_tokens ?? 0,
+                                            };
+                                            if (!isNaN(rateLimit5h)) {
+                                                usageWithRates.rateLimitAfter5h = rateLimit5h;
+                                            }
+                                            if (!isNaN(rateLimit7d)) {
+                                                usageWithRates.rateLimitAfter7d = rateLimit7d;
+                                            }
+                                            tracer.setUsage(usageWithRates);
+                                        }
+                                    }
+                                    tracer.recordMetrics();
+                                    const responseJsonStr = JSON.stringify(responseJson);
+                                    tracer.recordBodySizes(bodyStr.length, responseJsonStr.length);
+                                    upstreamSpan?.end();
+                                    tracer.end(response.status, Date.now() - requestStartTime);
+                                    const traceCtx = tracer.getTraceContext();
+                                    logRequest({
+                                        timestamp: new Date().toISOString(),
+                                        requestId: ctx.requestId,
+                                        method: ctx.method,
+                                        path: ctx.path,
+                                        model: body.model,
+                                        stream: false,
+                                        toolCount,
+                                        account: "passthrough",
+                                        accountType: "passthrough",
+                                        responseStatus: response.status,
+                                        responseTimeMs: Date.now() - requestStartTime,
+                                        inputTokens: usage?.input_tokens,
+                                        outputTokens: usage?.output_tokens,
+                                        cacheCreationTokens: usage?.cache_creation_input_tokens,
+                                        cacheReadTokens: usage?.cache_read_input_tokens,
+                                        traceId: traceCtx.traceId,
+                                        spanId: traceCtx.spanId,
+                                    });
+                                }
+                                else {
+                                    upstreamSpan?.end();
+                                    tracer?.end(response.status, Date.now() - requestStartTime);
+                                    logRequest({
+                                        timestamp: new Date().toISOString(),
+                                        requestId: ctx.requestId,
+                                        method: ctx.method,
+                                        path: ctx.path,
+                                        model: body.model,
+                                        stream: false,
+                                        toolCount,
+                                        account: "passthrough",
+                                        accountType: "passthrough",
+                                        responseStatus: response.status,
+                                        responseTimeMs: Date.now() - requestStartTime,
+                                    });
+                                }
+                                return responseJson;
+                            }
+                            // ── END CLI --passthrough ─────────────────────────────
                             const fs = await import("fs");
                             const os = await import("os");
                             const accounts = [];
@@ -330,8 +921,7 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                     // On cold start, lastToken is empty — don't treat that as a
                                     // credential change; only compare on subsequent reloads.
                                     const tokens = await tokenStore.loadTokens(key);
-                                    const hasTrackedTokens = existingState.lastToken !== undefined &&
-                                        existingState.lastToken !== "";
+                                    const hasTrackedTokens = existingState.lastToken !== undefined && existingState.lastToken !== "";
                                     const tokenChanged = tokens &&
                                         hasTrackedTokens &&
                                         (existingState.lastToken !== tokens.accessToken ||
@@ -436,13 +1026,14 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                 });
                             }
                             if (accounts.length === 0) {
-                                return buildClaudeError(401, "No Anthropic credentials found");
+                                tracer?.setError("authentication_error", "No Anthropic credentials found");
+                                tracer?.end(401, Date.now() - requestStartTime);
+                                return buildLoggedClaudeError(401, "No Anthropic credentials found");
                             }
                             // Sync in-memory runtime state with current token material.
                             for (const account of accounts) {
                                 const state = getOrCreateRuntimeState(account.key);
-                                const tokenChanged = state.lastToken !== account.token ||
-                                    state.lastRefreshToken !== account.refreshToken;
+                                const tokenChanged = state.lastToken !== account.token || state.lastRefreshToken !== account.refreshToken;
                                 if (tokenChanged) {
                                     if (state.permanentlyDisabled) {
                                         logger.always(`[proxy] account=${account.label} credentials changed, re-enabling`);
@@ -456,11 +1047,13 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                 state.lastRefreshToken = account.refreshToken;
                             }
                             const enabledAccounts = accounts.filter((account) => {
-                                return !getOrCreateRuntimeState(account.key)
-                                    .permanentlyDisabled;
+                                return !getOrCreateRuntimeState(account.key).permanentlyDisabled;
                             });
                             if (enabledAccounts.length === 0) {
-                                return buildClaudeError(401, formatReauthMessage(accounts.map((account) => account.label)));
+                                const reauthMsg = formatReauthMessage(accounts.map((account) => account.label));
+                                tracer?.setError("authentication_error", reauthMsg);
+                                tracer?.end(401, Date.now() - requestStartTime);
+                                return buildLoggedClaudeError(401, reauthMsg);
                             }
                             // Order accounts based on the configured strategy.
                             // - fill-first: always start with the primary account;
@@ -472,8 +1065,7 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                             // (e.g. a new account was authenticated while the proxy was running).
                             // Only applies to round-robin; fill-first uses primaryAccountIndex
                             // as a sticky primary and should not be disrupted.
-                            if (accountStrategy === "round-robin" &&
-                                orderedAccounts.length !== lastKnownAccountCount) {
+                            if (accountStrategy === "round-robin" && orderedAccounts.length !== lastKnownAccountCount) {
                                 primaryAccountIndex = 0;
                                 lastKnownAccountCount = orderedAccounts.length;
                             }
@@ -481,8 +1073,7 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                 if (accountStrategy === "round-robin") {
                                     // Advance the index on every request for even distribution
                                     const idx = primaryAccountIndex % orderedAccounts.length;
-                                    primaryAccountIndex =
-                                        (primaryAccountIndex + 1) % orderedAccounts.length;
+                                    primaryAccountIndex = (primaryAccountIndex + 1) % orderedAccounts.length;
                                     if (idx > 0) {
                                         const head = orderedAccounts.splice(0, idx);
                                         orderedAccounts.push(...head);
@@ -501,24 +1092,30 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                             let sawRateLimit = false;
                             let sawNetworkError = false;
                             let sawTransientFailure = false;
+                            let invalidRequestFailure = null;
                             let authFailureMessage = null;
-                            const bodyStr = JSON.stringify(body);
+                            const normalizedAnthropicBody = normalizeClaudeRequestForAnthropic(body);
+                            const bodyStr = JSON.stringify(normalizedAnthropicBody);
                             const requestStart = Date.now();
-                            const toolCount = Array.isArray(body.tools)
-                                ? body.tools.length
-                                : 0;
+                            const toolCount = Array.isArray(body.tools) ? body.tools.length : 0;
                             const url = "https://api.anthropic.com/v1/messages?beta=true";
                             const clientHeaders = ctx.headers ?? {};
+                            const clientSnapshotBody = extractSnapshotBody(body);
+                            const isClaudeClientRequest = isLikelyClaudeClient(clientHeaders, clientSnapshotBody);
+                            let attemptNumber = 0;
+                            // OTel: account selection span (covers the whole selection phase)
+                            const acctSelectionSpan = tracer?.startAccountSelection();
                             for (const account of orderedAccounts) {
                                 const accountState = getOrCreateRuntimeState(account.key);
-                                if (accountState.coolingUntil &&
-                                    accountState.coolingUntil > Date.now()) {
+                                if (accountState.coolingUntil && accountState.coolingUntil > Date.now()) {
                                     continue;
                                 }
-                                const logAttempt = (status, errorType, errorMessage) => {
-                                    logRequest({
+                                const logAttempt = (status, errorType, errorMessage, extra) => {
+                                    const traceCtx = tracer?.getTraceContext();
+                                    logRequestAttempt({
                                         timestamp: new Date().toISOString(),
                                         requestId: ctx.requestId,
+                                        attempt: attemptNumber,
                                         method: ctx.method,
                                         path: ctx.path,
                                         model: body.model,
@@ -530,8 +1127,31 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                         responseTimeMs: Date.now() - requestStart,
                                         ...(errorType ? { errorType } : {}),
                                         ...(errorMessage ? { errorMessage } : {}),
+                                        ...(extra?.inputTokens !== undefined ? { inputTokens: extra.inputTokens } : {}),
+                                        ...(extra?.outputTokens !== undefined ? { outputTokens: extra.outputTokens } : {}),
+                                        ...(extra?.cacheCreationTokens !== undefined
+                                            ? { cacheCreationTokens: extra.cacheCreationTokens }
+                                            : {}),
+                                        ...(extra?.cacheReadTokens !== undefined ? { cacheReadTokens: extra.cacheReadTokens } : {}),
+                                        ...(traceCtx ? { traceId: traceCtx.traceId, spanId: traceCtx.spanId } : {}),
                                     });
                                 };
+                                // OTel: record account selection and start upstream attempt span
+                                attemptNumber++;
+                                if (tracer) {
+                                    // End the selection span on first actual attempt
+                                    if (attemptNumber === 1 && acctSelectionSpan) {
+                                        tracer.setAccountSelection({
+                                            strategy: accountStrategy,
+                                            accountsTotal: accounts.length,
+                                            accountsHealthy: enabledAccounts.length,
+                                            selectedAccount: account.label,
+                                            accountType: account.type,
+                                        });
+                                        acctSelectionSpan.end();
+                                    }
+                                }
+                                let upstreamSpan;
                                 // Auto-refresh expiring access tokens once before making the request.
                                 if (needsRefresh(account)) {
                                     const refreshed = await refreshToken(account);
@@ -545,8 +1165,7 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                         accountState.consecutiveRefreshFailures += 1;
                                         lastError = `token refresh failed for account=${account.label}: ${refreshed.error?.slice(0, 200) ?? "unknown"}`;
                                         logger.debug(`[proxy] preflight refresh failed account=${account.label} failures=${accountState.consecutiveRefreshFailures}`);
-                                        if (accountState.consecutiveRefreshFailures >=
-                                            MAX_CONSECUTIVE_REFRESH_FAILURES) {
+                                        if (accountState.consecutiveRefreshFailures >= MAX_CONSECUTIVE_REFRESH_FAILURES) {
                                             await disableAccountUntilReauth(account, accountState);
                                             authFailureMessage = formatReauthMessage(account.label);
                                             logAttempt(401, "authentication_error", String(lastError));
@@ -555,6 +1174,9 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                     }
                                 }
                                 const isOAuth = account.type === "oauth";
+                                const snapshot = isOAuth
+                                    ? await maybeRefreshClaudeSnapshot(account.label, account.key, clientHeaders, bodyStr)
+                                    : null;
                                 // Decision 6: Passthrough client headers, fill gaps only.
                                 // Start with a copy of incoming client headers, then set
                                 // defaults for anything the client didn't send. Always
@@ -562,8 +1184,7 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                 const headers = {};
                                 for (const [hk, hv] of Object.entries(clientHeaders)) {
                                     const lower = hk.toLowerCase();
-                                    if (typeof hv === "string" &&
-                                        !BLOCKED_UPSTREAM_HEADERS.has(lower)) {
+                                    if (typeof hv === "string" && !BLOCKED_UPSTREAM_HEADERS.has(lower)) {
                                         headers[lower] = hv;
                                     }
                                 }
@@ -579,11 +1200,11 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                 }
                                 // Apply header snapshot defaults for OAuth accounts
                                 if (isOAuth) {
-                                    await applyHeaderSnapshot(headers, account.label);
+                                    applySnapshotHeaders(headers, snapshot);
                                 }
                                 // Hard defaults for anything still missing
                                 if (!headers["user-agent"]) {
-                                    headers["user-agent"] = "claude-cli/2.1.86 (external, cli)";
+                                    headers["user-agent"] = CLAUDE_CLI_USER_AGENT;
                                 }
                                 if (!headers["anthropic-version"]) {
                                     headers["anthropic-version"] = "2023-06-01";
@@ -591,15 +1212,25 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                 if (!headers["anthropic-dangerous-direct-browser-access"]) {
                                     headers["anthropic-dangerous-direct-browser-access"] = "true";
                                 }
+                                if (!headers["x-app"]) {
+                                    headers["x-app"] = "cli";
+                                }
+                                if (!headers["accept"]) {
+                                    headers["accept"] = "application/json";
+                                }
                                 // Manage anthropic-beta header based on auth type.
                                 // OAuth requires specific betas; API-key must NOT carry them.
                                 if (isOAuth) {
-                                    const existing = new Set((headers["anthropic-beta"] ?? "")
+                                    const betaSeed = isClaudeClientRequest
+                                        ? (headers["anthropic-beta"] ?? "")
+                                        : (clientHeaders["anthropic-beta"] ?? "");
+                                    const existing = new Set(betaSeed
                                         .split(",")
                                         .map((s) => s.trim())
                                         .filter(Boolean));
-                                    existing.add("oauth-2025-04-20");
-                                    existing.add("claude-code-20250219");
+                                    for (const beta of isClaudeClientRequest ? CLAUDE_CODE_OAUTH_BETAS : NON_CLAUDE_OAUTH_BETAS) {
+                                        existing.add(beta);
+                                    }
                                     headers["anthropic-beta"] = [...existing].join(",");
                                 }
                                 else {
@@ -607,7 +1238,7 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                     const cleaned = (headers["anthropic-beta"] ?? "")
                                         .split(",")
                                         .map((s) => s.trim())
-                                        .filter((s) => s && s !== "oauth-2025-04-20")
+                                        .filter((s) => s && !CLAUDE_CODE_OAUTH_BETAS.includes(s))
                                         .join(",");
                                     if (cleaned) {
                                         headers["anthropic-beta"] = cleaned;
@@ -616,13 +1247,46 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                         delete headers["anthropic-beta"];
                                     }
                                 }
-                                // Polyfill request body for OAuth accounts
-                                const buildUpstreamBody = () => isOAuth ? polyfillOAuthBody(bodyStr, account.token) : bodyStr;
-                                const finalBodyStr = buildUpstreamBody();
+                                // Polyfill request body for ALL OAuth accounts.
+                                // Anthropic requires metadata.user_id and billing headers
+                                // for OAuth — not just Claude Code clients.
+                                const shouldPolyfillBody = isOAuth;
+                                const buildUpstreamBody = (token) => shouldPolyfillBody
+                                    ? polyfillOAuthBody(bodyStr, token, snapshot, headers["x-claude-code-session-id"])
+                                    : { bodyStr };
+                                const polyfilledBody = buildUpstreamBody(account.token);
+                                if (isOAuth && polyfilledBody.sessionId && !headers["x-claude-code-session-id"]) {
+                                    headers["x-claude-code-session-id"] = polyfilledBody.sessionId;
+                                }
+                                const finalBodyStr = polyfilledBody.bodyStr;
                                 logger.always(`[proxy] → account=${account.label} (${account.type})`);
-                                recordRequest(account.label, account.type);
+                                recordAttempt(account.label, account.type);
                                 // Log full request for debugging (written to ~/.neurolink/logs/proxy-debug-*.jsonl)
                                 const fetchStartMs = Date.now();
+                                // OTel: start upstream attempt span and inject trace headers
+                                if (tracer) {
+                                    upstreamSpan = tracer.startUpstreamAttempt({
+                                        attempt: attemptNumber,
+                                        account: account.label,
+                                        polyfillHeaders: isOAuth,
+                                        polyfillBody: isOAuth,
+                                        upstreamUrl: url,
+                                    });
+                                    tracer.logUpstreamRequestHeaders(headers);
+                                    tracer.logUpstreamRequestBody(finalBodyStr);
+                                    const traceHeaders = tracer.getTraceHeaders();
+                                    Object.assign(headers, traceHeaders);
+                                }
+                                logProxyBody({
+                                    phase: "upstream_request",
+                                    headers,
+                                    body: finalBodyStr,
+                                    bodySize: Buffer.byteLength(finalBodyStr, "utf8"),
+                                    contentType: headers["content-type"] ?? "application/json",
+                                    account: account.label,
+                                    accountType: account.type,
+                                    attempt: attemptNumber,
+                                });
                                 let response;
                                 try {
                                     response = await fetch(url, {
@@ -638,14 +1302,16 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                     }
                                     // Decision 8: Network errors — immediate rotation, no cooldown
                                     sawNetworkError = true;
-                                    recordError(account.label, account.type, 502);
+                                    recordAttemptError(account.label, account.type, 502);
                                     const errorCode = getErrorCode(fetchErr) ?? "unknown";
-                                    const errorMessage = fetchErr instanceof Error
-                                        ? fetchErr.message
-                                        : String(fetchErr);
+                                    const errorMessage = fetchErr instanceof Error ? fetchErr.message : String(fetchErr);
                                     lastError = errorMessage;
                                     logger.always(`[proxy] fetch error account=${account.label} code=${errorCode} (rotating): ${errorMessage}`);
                                     logAttempt(502, "network_error", errorMessage);
+                                    tracer?.setError("network_error", errorMessage);
+                                    tracer?.recordRetry(account.label, "network_error");
+                                    upstreamSpan?.end();
+                                    upstreamSpan = undefined;
                                     continue;
                                 }
                                 // Check 429 (with Retry-After + exponential backoff) → continue.
@@ -660,7 +1326,6 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                         }
                                         else {
                                             const date = new Date(retryAfter);
-                                            // eslint-disable-next-line max-depth
                                             if (!Number.isNaN(date.getTime())) {
                                                 cooldownMs = Math.max(date.getTime() - Date.now(), 1000);
                                             }
@@ -668,22 +1333,24 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                     }
                                     const level = accountState.backoffLevel;
                                     const baseCooldown = cooldownMs > 0 ? cooldownMs : RATE_LIMIT_BACKOFF_BASE_MS;
-                                    const backoffMs = Math.min(baseCooldown * Math.pow(2, level), RATE_LIMIT_BACKOFF_CAP_MS);
+                                    const backoffMs = Math.min(baseCooldown * 2 ** level, RATE_LIMIT_BACKOFF_CAP_MS);
                                     accountState.coolingUntil = Date.now() + backoffMs;
                                     accountState.backoffLevel += 1;
                                     advancePrimaryIfCurrent(account.key, enabledAccounts.length, orderedAccounts[0]?.key);
-                                    recordError(account.label, account.type, 429);
+                                    recordAttemptError(account.label, account.type, 429);
                                     recordCooldown(account.label, account.type, accountState.coolingUntil, accountState.backoffLevel);
                                     lastError = await response.text();
                                     logger.always(`[proxy] ← 429 account=${account.label} backoff-level=${accountState.backoffLevel} cooldown=${Math.round(backoffMs / 1000)}s`);
                                     logAttempt(429, "rate_limit_error", String(lastError));
+                                    tracer?.setError("rate_limit_error", String(lastError).slice(0, 500));
+                                    tracer?.recordRetry(account.label, "rate_limit");
+                                    upstreamSpan?.end();
+                                    upstreamSpan = undefined;
                                     continue;
                                 }
                                 // On 401 for refreshable OAuth: refresh token and retry before failing over.
-                                if (response.status === 401 &&
-                                    account.type === "oauth" &&
-                                    account.refreshToken) {
-                                    recordError(account.label, account.type, 401);
+                                if (response.status === 401 && account.type === "oauth" && account.refreshToken) {
+                                    recordAttemptError(account.label, account.type, 401);
                                     let authRetrySucceeded = false;
                                     let authRetryError = "received 401 from Anthropic";
                                     for (let authRetry = 0; authRetry < MAX_AUTH_RETRIES; authRetry++) {
@@ -694,14 +1361,11 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                             authRetryError = `refresh failed for account=${account.label} attempt ${authRetry + 1}/${MAX_AUTH_RETRIES}: ${refreshSucceeded.error?.slice(0, 200) ?? "unknown"}`;
                                             lastError = authRetryError;
                                             logger.always(`[proxy] ⚠ account=${account.label} refresh failed on attempt ${authRetry + 1}`);
-                                            // eslint-disable-next-line max-depth
-                                            if (accountState.consecutiveRefreshFailures >=
-                                                MAX_CONSECUTIVE_REFRESH_FAILURES) {
+                                            if (accountState.consecutiveRefreshFailures >= MAX_CONSECUTIVE_REFRESH_FAILURES) {
                                                 await disableAccountUntilReauth(account, accountState);
                                                 authFailureMessage = formatReauthMessage(account.label);
                                                 break;
                                             }
-                                            // eslint-disable-next-line max-depth
                                             if (authRetry < MAX_AUTH_RETRIES - 1) {
                                                 await sleep(2000);
                                             }
@@ -715,27 +1379,24 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                             const retryResp = await fetch(url, {
                                                 method: "POST",
                                                 headers,
-                                                body: buildUpstreamBody(),
+                                                body: buildUpstreamBody(account.token).bodyStr,
                                                 signal: AbortSignal.timeout(UPSTREAM_FETCH_TIMEOUT_MS),
                                             });
-                                            // eslint-disable-next-line max-depth
                                             if (retryResp.ok) {
                                                 authRetrySucceeded = true;
                                                 accountState.consecutiveRefreshFailures = 0;
                                                 accountState.backoffLevel = 0;
                                                 accountState.coolingUntil = undefined;
                                                 logger.always(`[proxy] ← 200 account=${account.label} (after ${authRetry + 1} refresh(es))`);
-                                                recordSuccess(account.label, account.type);
-                                                logAttempt(retryResp.status);
+                                                // Final success is recorded only once the response path
+                                                // that reaches the client is fully determined.
                                                 // Capture quota headers after successful auth-retry
                                                 {
                                                     const retryQuota = parseQuotaHeaders(retryResp.headers);
-                                                    // eslint-disable-next-line max-depth
                                                     if (retryQuota) {
                                                         saveAccountQuota(account.label, retryQuota).catch(() => { });
                                                     }
                                                 }
-                                                // eslint-disable-next-line max-depth
                                                 if (body.stream && retryResp.body) {
                                                     const retryReader = retryResp.body.getReader();
                                                     let retryStreamClosed = false;
@@ -757,9 +1418,7 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                                                 controller.enqueue(value);
                                                             }
                                                             catch (streamErr) {
-                                                                const errMsg = streamErr instanceof Error
-                                                                    ? streamErr.message
-                                                                    : String(streamErr);
+                                                                const errMsg = streamErr instanceof Error ? streamErr.message : String(streamErr);
                                                                 logger.always(`[proxy] mid-stream error (auth-retry) account=${account.label}: ${errMsg}`);
                                                                 logStreamError({
                                                                     timestamp: new Date().toISOString(),
@@ -782,12 +1441,57 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                                             retryReader.cancel();
                                                         },
                                                     });
+                                                    // OTel: pipe auth-retry stream through SSE interceptor
+                                                    let retryClientStream = retryStream;
+                                                    if (tracer) {
+                                                        try {
+                                                            const { stream: retryInterceptor, telemetry: retryTelemetry } = createSSEInterceptor();
+                                                            retryClientStream = retryStream.pipeThrough(retryInterceptor);
+                                                            const capturedTracer2 = tracer;
+                                                            const capturedUpstreamSpan2 = upstreamSpan;
+                                                            const capturedRetryResp = retryResp;
+                                                            const capturedRetryRequestBytes = finalBodyStr.length;
+                                                            const capturedAccountLabel2 = account.label;
+                                                            retryTelemetry
+                                                                .then((data) => {
+                                                                capturedTracer2.setUsage({
+                                                                    inputTokens: data.usage.inputTokens,
+                                                                    outputTokens: data.usage.outputTokens,
+                                                                    cacheCreationTokens: data.usage.cacheCreationInputTokens,
+                                                                    cacheReadTokens: data.usage.cacheReadInputTokens,
+                                                                });
+                                                                capturedTracer2.logStreamEvents(data.events);
+                                                                capturedTracer2.logUpstreamResponseHeaders(Object.fromEntries([...capturedRetryResp.headers.entries()]));
+                                                                capturedTracer2.recordMetrics();
+                                                                capturedTracer2.recordBodySizes(capturedRetryRequestBytes, data.totalBytesReceived);
+                                                                capturedUpstreamSpan2?.end();
+                                                                capturedTracer2.end(200, Date.now() - requestStartTime);
+                                                                recordFinalSuccess(capturedAccountLabel2, account.type);
+                                                                // Deferred JSONL log with token usage (auth-retry streaming)
+                                                                logFinalRequest(200, capturedAccountLabel2, account.type, undefined, undefined, {
+                                                                    inputTokens: data.usage.inputTokens,
+                                                                    outputTokens: data.usage.outputTokens,
+                                                                    cacheCreationTokens: data.usage.cacheCreationInputTokens,
+                                                                    cacheReadTokens: data.usage.cacheReadInputTokens,
+                                                                });
+                                                            })
+                                                                .catch((err) => {
+                                                                capturedTracer2.setError("stream_error", err instanceof Error ? err.message : String(err));
+                                                                capturedUpstreamSpan2?.end();
+                                                                capturedTracer2.end(500, Date.now() - requestStartTime);
+                                                                recordFinalError(500, capturedAccountLabel2, account.type);
+                                                                logFinalRequest(500, capturedAccountLabel2, account.type, "stream_error", err instanceof Error ? err.message : String(err));
+                                                            });
+                                                        }
+                                                        catch {
+                                                            retryClientStream = retryStream;
+                                                        }
+                                                    }
                                                     const responseHeaders = {
                                                         "content-type": "text/event-stream",
                                                         "cache-control": "no-cache",
                                                         connection: "keep-alive",
                                                     };
-                                                    // eslint-disable-next-line max-depth
                                                     for (const h of [
                                                         "retry-after",
                                                         "anthropic-ratelimit-requests-remaining",
@@ -796,25 +1500,81 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                                         "anthropic-ratelimit-tokens-limit",
                                                     ]) {
                                                         const val = retryResp.headers.get(h);
-                                                        // eslint-disable-next-line max-depth
                                                         if (val) {
                                                             responseHeaders[h] = val;
                                                         }
                                                     }
-                                                    return new Response(retryStream, {
+                                                    return new Response(retryClientStream, {
                                                         status: retryResp.status,
                                                         headers: responseHeaders,
                                                     });
                                                 }
-                                                return retryResp.json();
+                                                // OTel: non-streaming auth-retry success
+                                                const retryRespHeaders = Object.fromEntries([...retryResp.headers.entries()]);
+                                                const retryText = await retryResp.text();
+                                                tracer?.logUpstreamResponseHeaders(retryRespHeaders);
+                                                tracer?.logUpstreamResponseBody(retryText);
+                                                logProxyBody({
+                                                    phase: "upstream_response",
+                                                    headers: retryRespHeaders,
+                                                    body: retryText,
+                                                    bodySize: Buffer.byteLength(retryText, "utf8"),
+                                                    contentType: retryRespHeaders["content-type"] ?? "application/json",
+                                                    account: account.label,
+                                                    accountType: account.type,
+                                                    attempt: attemptNumber,
+                                                    responseStatus: retryResp.status,
+                                                    durationMs: Date.now() - fetchStartMs,
+                                                });
+                                                logProxyBody({
+                                                    phase: "client_response",
+                                                    headers: retryRespHeaders,
+                                                    body: retryText,
+                                                    bodySize: Buffer.byteLength(retryText, "utf8"),
+                                                    contentType: retryRespHeaders["content-type"] ?? "application/json",
+                                                    account: account.label,
+                                                    accountType: account.type,
+                                                    attempt: attemptNumber,
+                                                    responseStatus: retryResp.status,
+                                                    durationMs: Date.now() - requestStartTime,
+                                                });
+                                                const retryJson = JSON.parse(retryText);
+                                                if (tracer && retryJson && typeof retryJson === "object") {
+                                                    const retryUsage = retryJson.usage;
+                                                    if (retryUsage) {
+                                                        tracer.setUsage({
+                                                            inputTokens: retryUsage.input_tokens ?? 0,
+                                                            outputTokens: retryUsage.output_tokens ?? 0,
+                                                            cacheCreationTokens: retryUsage.cache_creation_input_tokens ?? 0,
+                                                            cacheReadTokens: retryUsage.cache_read_input_tokens ?? 0,
+                                                        });
+                                                    }
+                                                    tracer.recordMetrics();
+                                                    const retryJsonStr = JSON.stringify(retryJson);
+                                                    tracer.recordBodySizes(finalBodyStr.length, retryJsonStr.length);
+                                                    upstreamSpan?.end();
+                                                    tracer.end(retryResp.status, Date.now() - requestStartTime);
+                                                    recordFinalSuccess(account.label, account.type);
+                                                    logFinalRequest(retryResp.status, account.label, account.type, undefined, undefined, {
+                                                        inputTokens: retryUsage?.input_tokens,
+                                                        outputTokens: retryUsage?.output_tokens,
+                                                        cacheCreationTokens: retryUsage?.cache_creation_input_tokens,
+                                                        cacheReadTokens: retryUsage?.cache_read_input_tokens,
+                                                    });
+                                                }
+                                                else {
+                                                    upstreamSpan?.end();
+                                                    recordFinalSuccess(account.label, account.type);
+                                                    logFinalRequest(retryResp.status, account.label, account.type);
+                                                }
+                                                return retryJson;
                                             }
                                             const retryStatus = retryResp.status;
                                             const retryBody = await retryResp.text();
                                             authRetryError = `retry ${authRetry + 1}/${MAX_AUTH_RETRIES} failed with status ${retryStatus}`;
                                             lastError = retryBody;
                                             logger.debug(`[proxy] retry ${authRetry + 1} failed: ${retryStatus} ${retryBody.substring(0, 120)}`);
-                                            recordError(account.label, account.type, retryStatus);
-                                            // eslint-disable-next-line max-depth
+                                            recordAttemptError(account.label, account.type, retryStatus);
                                             if (retryStatus === 429) {
                                                 sawRateLimit = true;
                                                 const retryAfter = retryResp.headers.get("retry-after");
@@ -827,38 +1587,33 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                                 recordCooldown(account.label, account.type, accountState.coolingUntil, accountState.backoffLevel);
                                                 break;
                                             }
-                                            // eslint-disable-next-line max-depth
-                                            if (retryStatus === 401 ||
-                                                retryStatus === 402 ||
-                                                retryStatus === 403) {
-                                                // eslint-disable-next-line max-depth
+                                            if (retryStatus === 401 || retryStatus === 402 || retryStatus === 403) {
                                                 if (authRetry < MAX_AUTH_RETRIES - 1) {
                                                     await sleep(1000);
                                                 }
                                                 continue;
                                             }
-                                            // eslint-disable-next-line max-depth
                                             if (isTransientHttpFailure(retryStatus, retryBody)) {
                                                 // Decision 8: No cooldown for transient errors — rotate immediately
                                                 sawTransientFailure = true;
                                                 break;
                                             }
                                             logAttempt(retryStatus, "api_error", summarizeErrorMessage(retryBody));
-                                            // eslint-disable-next-line max-depth
+                                            recordFinalError(retryStatus, account.label, account.type);
                                             try {
+                                                logFinalRequest(retryStatus, account.label, account.type, "api_error", summarizeErrorMessage(retryBody));
                                                 return JSON.parse(retryBody);
                                             }
                                             catch {
+                                                logFinalRequest(retryStatus, account.label, account.type, "api_error", summarizeErrorMessage(retryBody));
                                                 return buildClaudeError(retryStatus, retryBody);
                                             }
                                         }
                                         catch (retryFetchErr) {
                                             // Decision 8: No cooldown for network errors — rotate immediately
                                             sawNetworkError = true;
-                                            recordError(account.label, account.type, 502);
-                                            const message = retryFetchErr instanceof Error
-                                                ? retryFetchErr.message
-                                                : String(retryFetchErr);
+                                            recordAttemptError(account.label, account.type, 502);
+                                            const message = retryFetchErr instanceof Error ? retryFetchErr.message : String(retryFetchErr);
                                             authRetryError = `network error on retry ${authRetry + 1}: ${message}`;
                                             lastError = authRetryError;
                                             logger.debug(`[proxy] ${authRetryError}`);
@@ -866,96 +1621,83 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                         }
                                     }
                                     if (!authRetrySucceeded) {
-                                        // eslint-disable-next-line max-depth
                                         if (!accountState.permanentlyDisabled) {
-                                            // eslint-disable-next-line max-depth
-                                            if (!accountState.coolingUntil ||
-                                                accountState.coolingUntil <= Date.now()) {
-                                                accountState.coolingUntil =
-                                                    Date.now() + AUTH_COOLDOWN_MS;
+                                            if (!accountState.coolingUntil || accountState.coolingUntil <= Date.now()) {
+                                                accountState.coolingUntil = Date.now() + AUTH_COOLDOWN_MS;
                                             }
                                             recordCooldown(account.label, account.type, accountState.coolingUntil, accountState.backoffLevel);
                                         }
                                         lastError = authRetryError;
                                         logger.always(`[proxy] ⚠ account=${account.label} auth retries exhausted, cooldown=5min`);
                                         logAttempt(401, "authentication_error", authRetryError);
+                                        tracer?.setError("authentication_error", authRetryError);
+                                        tracer?.recordRetry(account.label, "auth_exhausted");
+                                        upstreamSpan?.end();
+                                        upstreamSpan = undefined;
                                         continue;
                                     }
                                 }
                                 if (!response.ok) {
                                     const errBody = await response.text();
-                                    // Log full error for debugging
                                     const errRespHeaders = {};
                                     response.headers.forEach((v, k) => {
                                         errRespHeaders[k] = v;
                                     });
-                                    logFullRequestResponse({
-                                        timestamp: new Date().toISOString(),
-                                        requestId: ctx.requestId,
+                                    tracer?.logUpstreamResponseHeaders(errRespHeaders);
+                                    tracer?.logUpstreamResponseBody(errBody);
+                                    logProxyBody({
+                                        phase: "upstream_response",
+                                        headers: errRespHeaders,
+                                        body: errBody,
+                                        bodySize: Buffer.byteLength(errBody, "utf8"),
+                                        contentType: errRespHeaders["content-type"] ?? "application/json",
                                         account: account.label,
-                                        model: body.model,
-                                        stream: !!body.stream,
-                                        requestHeaders: redactSensitiveHeaders(headers),
-                                        requestBody: {
-                                            model: body.model,
-                                            max_tokens: body.max_tokens,
-                                            stream: body.stream,
-                                            system: Array.isArray(body.system)
-                                                ? `[${body.system.length} blocks]`
-                                                : typeof body.system,
-                                            messages: Array.isArray(body.messages)
-                                                ? `[${body.messages.length} messages]`
-                                                : "?",
-                                            tools: Array.isArray(body.tools)
-                                                ? `[${body.tools.length} tools]`
-                                                : "none",
-                                            tool_choice: body.tool_choice,
-                                            thinking: body.thinking,
-                                        },
-                                        requestBodySize: bodyStr.length,
+                                        accountType: account.type,
+                                        attempt: attemptNumber,
                                         responseStatus: response.status,
-                                        responseHeaders: errRespHeaders,
-                                        responseBody: errBody.substring(0, 2000),
-                                        responseBodySize: errBody.length,
                                         durationMs: Date.now() - fetchStartMs,
                                     });
-                                    // Request-shape errors (do not retry).
+                                    // Upstream invalid_request_error responses are not retried on the
+                                    // same Anthropic account, but may still be handed to fallback providers.
                                     if (isInvalidRequestError(response.status, errBody)) {
-                                        logger.always(`[proxy] ← ${response.status} request-shape error (no retry)`);
+                                        logger.always(`[proxy] ← ${response.status} upstream invalid_request_error`);
                                         logAttempt(response.status, "invalid_request_error", summarizeErrorMessage(errBody));
-                                        try {
-                                            return JSON.parse(errBody);
-                                        }
-                                        catch {
-                                            return buildClaudeError(response.status, errBody);
-                                        }
+                                        tracer?.setError("invalid_request_error", summarizeErrorMessage(errBody));
+                                        invalidRequestFailure = {
+                                            status: response.status,
+                                            body: errBody,
+                                            contentType: errRespHeaders["content-type"],
+                                        };
+                                        lastError = summarizeErrorMessage(errBody);
+                                        upstreamSpan?.end();
+                                        upstreamSpan = undefined;
+                                        break;
                                     }
                                     // Auth failures for OAuth accounts without refresh token.
-                                    if ((response.status === 401 ||
-                                        response.status === 402 ||
-                                        response.status === 403) &&
+                                    if ((response.status === 401 || response.status === 402 || response.status === 403) &&
                                         account.type === "oauth" &&
                                         !account.refreshToken) {
-                                        recordError(account.label, account.type, response.status);
+                                        recordAttemptError(account.label, account.type, response.status);
                                         accountState.consecutiveRefreshFailures += 1;
                                         accountState.coolingUntil = Date.now() + AUTH_COOLDOWN_MS;
                                         recordCooldown(account.label, account.type, accountState.coolingUntil, accountState.backoffLevel);
-                                        if (accountState.consecutiveRefreshFailures >=
-                                            MAX_CONSECUTIVE_REFRESH_FAILURES) {
+                                        if (accountState.consecutiveRefreshFailures >= MAX_CONSECUTIVE_REFRESH_FAILURES) {
                                             await disableAccountUntilReauth(account, accountState);
                                         }
                                         authFailureMessage = formatReauthMessage(account.label);
                                         logger.always(`[proxy] ← ${response.status} account=${account.label} cooldown=5min`);
                                         lastError = errBody;
                                         logAttempt(response.status, "authentication_error", summarizeErrorMessage(errBody));
+                                        tracer?.setError("authentication_error", summarizeErrorMessage(errBody));
+                                        tracer?.recordRetry(account.label, "auth_no_refresh");
+                                        upstreamSpan?.end();
+                                        upstreamSpan = undefined;
                                         continue;
                                     }
                                     // Auth failures for API-key accounts.
-                                    if ((response.status === 401 ||
-                                        response.status === 402 ||
-                                        response.status === 403) &&
+                                    if ((response.status === 401 || response.status === 402 || response.status === 403) &&
                                         account.type === "api_key") {
-                                        recordError(account.label, account.type, response.status);
+                                        recordAttemptError(account.label, account.type, response.status);
                                         authFailureMessage =
                                             "Authentication failed for Anthropic API key credentials. Update ANTHROPIC_API_KEY or re-login with OAuth.";
                                         accountState.coolingUntil = Date.now() + AUTH_COOLDOWN_MS;
@@ -963,49 +1705,126 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                         logger.always(`[proxy] ← ${response.status} account=${account.label} cooldown=5min`);
                                         lastError = errBody;
                                         logAttempt(response.status, "authentication_error", summarizeErrorMessage(errBody));
+                                        tracer?.setError("authentication_error", summarizeErrorMessage(errBody));
+                                        tracer?.recordRetry(account.label, "auth_api_key");
+                                        upstreamSpan?.end();
+                                        upstreamSpan = undefined;
                                         continue;
                                     }
                                     // 404 is generally model/account specific; return immediately (no cooldown per Decision 8).
                                     if (response.status === 404) {
-                                        recordError(account.label, account.type, response.status);
+                                        recordFinalError(response.status, account.label, account.type);
                                         logger.always(`[proxy] ← 404 account=${account.label}`);
                                         logAttempt(404, "not_found_error", summarizeErrorMessage(errBody));
+                                        tracer?.setError("not_found_error", summarizeErrorMessage(errBody));
+                                        upstreamSpan?.end();
+                                        tracer?.end(404, Date.now() - requestStartTime);
                                         try {
-                                            return JSON.parse(errBody);
+                                            const parsedError = JSON.parse(errBody);
+                                            logFinalRequest(404, account.label, account.type, "not_found_error", summarizeErrorMessage(errBody));
+                                            logProxyBody({
+                                                phase: "client_response",
+                                                headers: {
+                                                    "content-type": errRespHeaders["content-type"] ?? "application/json",
+                                                },
+                                                body: errBody,
+                                                bodySize: Buffer.byteLength(errBody, "utf8"),
+                                                contentType: errRespHeaders["content-type"] ?? "application/json",
+                                                account: account.label,
+                                                accountType: account.type,
+                                                attempt: attemptNumber,
+                                                responseStatus: 404,
+                                                durationMs: Date.now() - requestStartTime,
+                                            });
+                                            return parsedError;
                                         }
                                         catch {
-                                            return buildClaudeError(404, errBody);
+                                            logFinalRequest(404, account.label, account.type, "not_found_error", summarizeErrorMessage(errBody));
+                                            const clientError = buildClaudeError(404, errBody);
+                                            const clientErrorBody = JSON.stringify(clientError);
+                                            logProxyBody({
+                                                phase: "client_response",
+                                                headers: { "content-type": "application/json" },
+                                                body: clientErrorBody,
+                                                bodySize: Buffer.byteLength(clientErrorBody, "utf8"),
+                                                contentType: "application/json",
+                                                account: account.label,
+                                                accountType: account.type,
+                                                attempt: attemptNumber,
+                                                responseStatus: 404,
+                                                durationMs: Date.now() - requestStartTime,
+                                            });
+                                            return clientError;
                                         }
                                     }
                                     // Decision 8: Transient upstream failures — immediate rotation, NO cooldown.
                                     if (isTransientHttpFailure(response.status, errBody)) {
-                                        recordError(account.label, account.type, response.status);
+                                        recordAttemptError(account.label, account.type, response.status);
                                         sawTransientFailure = true;
                                         // No cooldown for transient errors (502, 503, etc.) — rotate immediately
                                         logger.always(`[proxy] ← ${response.status} account=${account.label} (transient, rotating)`);
                                         lastError = errBody;
                                         logAttempt(response.status, "api_error", summarizeErrorMessage(errBody));
+                                        tracer?.setError("transient_error", summarizeErrorMessage(errBody));
+                                        tracer?.recordRetry(account.label, "transient");
+                                        upstreamSpan?.end();
+                                        upstreamSpan = undefined;
                                         continue;
                                     }
                                     // Other non-ok errors → return as-is.
-                                    recordError(account.label, account.type, response.status);
+                                    recordFinalError(response.status, account.label, account.type);
                                     logger.always(`[proxy] ← ${response.status} account=${account.label}`);
                                     logger.debug(`[claude-proxy] error body: ${errBody.substring(0, 200)}`);
                                     logAttempt(response.status, "api_error", summarizeErrorMessage(errBody));
+                                    tracer?.setError("api_error", summarizeErrorMessage(errBody));
+                                    upstreamSpan?.end();
+                                    tracer?.end(response.status, Date.now() - requestStartTime);
                                     try {
-                                        return JSON.parse(errBody);
+                                        const parsedError = JSON.parse(errBody);
+                                        logFinalRequest(response.status, account.label, account.type, "api_error", summarizeErrorMessage(errBody));
+                                        logProxyBody({
+                                            phase: "client_response",
+                                            headers: {
+                                                "content-type": errRespHeaders["content-type"] ?? "application/json",
+                                            },
+                                            body: errBody,
+                                            bodySize: Buffer.byteLength(errBody, "utf8"),
+                                            contentType: errRespHeaders["content-type"] ?? "application/json",
+                                            account: account.label,
+                                            accountType: account.type,
+                                            attempt: attemptNumber,
+                                            responseStatus: response.status,
+                                            durationMs: Date.now() - requestStartTime,
+                                        });
+                                        return parsedError;
                                     }
                                     catch {
-                                        return buildClaudeError(response.status, errBody);
+                                        logFinalRequest(response.status, account.label, account.type, "api_error", summarizeErrorMessage(errBody));
+                                        const clientError = buildClaudeError(response.status, errBody);
+                                        const clientErrorBody = JSON.stringify(clientError);
+                                        logProxyBody({
+                                            phase: "client_response",
+                                            headers: { "content-type": "application/json" },
+                                            body: clientErrorBody,
+                                            bodySize: Buffer.byteLength(clientErrorBody, "utf8"),
+                                            contentType: "application/json",
+                                            account: account.label,
+                                            accountType: account.type,
+                                            attempt: attemptNumber,
+                                            responseStatus: response.status,
+                                            durationMs: Date.now() - requestStartTime,
+                                        });
+                                        return clientError;
                                     }
                                 }
                                 // Success path.
                                 accountState.backoffLevel = 0;
                                 accountState.coolingUntil = undefined;
                                 accountState.consecutiveRefreshFailures = 0;
-                                recordSuccess(account.label, account.type);
                                 logger.always(`[proxy] ← ${response.status} account=${account.label}`);
-                                logAttempt(response.status);
+                                // NOTE: logAttempt is deferred below so we can include token
+                                // usage.  For streaming, the SSE interceptor callback logs it;
+                                // for non-streaming, we log after JSON parsing.
                                 // Capture quota/utilisation headers (fire-and-forget).
                                 const quota = parseQuotaHeaders(response.headers);
                                 if (quota) {
@@ -1013,53 +1832,25 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                         // Non-fatal: quota persistence is best-effort
                                     });
                                 }
-                                // Log full request + response headers for debugging
                                 const respHeaders = {};
                                 response.headers.forEach((v, k) => {
                                     respHeaders[k] = v;
                                 });
-                                logFullRequestResponse({
-                                    timestamp: new Date().toISOString(),
-                                    requestId: ctx.requestId,
-                                    account: account.label,
-                                    model: body.model,
-                                    stream: !!body.stream,
-                                    requestHeaders: redactSensitiveHeaders(headers),
-                                    requestBody: {
-                                        model: body.model,
-                                        max_tokens: body.max_tokens,
-                                        stream: body.stream,
-                                        system: Array.isArray(body.system)
-                                            ? `[${body.system.length} blocks]`
-                                            : typeof body.system,
-                                        messages: Array.isArray(body.messages)
-                                            ? `[${body.messages.length} messages]`
-                                            : "?",
-                                        tools: Array.isArray(body.tools)
-                                            ? `[${body.tools.length} tools]`
-                                            : "none",
-                                        tool_choice: body.tool_choice,
-                                        thinking: body.thinking,
-                                        metadata: body.metadata ? "present" : "absent",
-                                    },
-                                    requestBodySize: bodyStr.length,
-                                    responseStatus: response.status,
-                                    responseHeaders: respHeaders,
-                                    durationMs: Date.now() - fetchStartMs,
-                                });
+                                tracer?.logUpstreamResponseHeaders(respHeaders);
                                 if (body.stream) {
                                     // Bootstrap retry: read first chunk to verify stream is valid.
                                     if (response.body) {
                                         const reader = response.body.getReader();
                                         const firstChunk = await reader.read();
-                                        if (firstChunk.done ||
-                                            !firstChunk.value ||
-                                            firstChunk.value.length === 0) {
+                                        if (firstChunk.done || !firstChunk.value || firstChunk.value.length === 0) {
                                             // Empty stream — retry with next account.
                                             reader.cancel();
                                             accountState.coolingUntil = Date.now() + 10_000;
                                             recordCooldown(account.label, account.type, accountState.coolingUntil, accountState.backoffLevel);
                                             logger.always(`[proxy] ← empty stream from account=${account.label}, trying next`);
+                                            tracer?.recordRetry(account.label, "empty_stream");
+                                            upstreamSpan?.end();
+                                            upstreamSpan = undefined;
                                             continue;
                                         }
                                         // Stream is valid — create a new ReadableStream with first chunk prepended.
@@ -1085,9 +1876,7 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                                     controller.enqueue(value);
                                                 }
                                                 catch (streamErr) {
-                                                    const errMsg = streamErr instanceof Error
-                                                        ? streamErr.message
-                                                        : String(streamErr);
+                                                    const errMsg = streamErr instanceof Error ? streamErr.message : String(streamErr);
                                                     logger.always(`[proxy] mid-stream error account=${account.label}: ${errMsg}`);
                                                     logStreamError({
                                                         timestamp: new Date().toISOString(),
@@ -1112,6 +1901,175 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                                 reader.cancel();
                                             },
                                         });
+                                        // OTel: pipe stream through SSE interceptor for telemetry extraction.
+                                        // The interceptor passes all bytes through unmodified and resolves
+                                        // its telemetry promise when the stream finishes.
+                                        const { stream: clientCaptureStream, capture: clientCapture } = createRawStreamCapture();
+                                        let streamSource = remainingStream;
+                                        if (tracer) {
+                                            try {
+                                                const { stream: interceptor, telemetry } = createSSEInterceptor({ captureRawText: true });
+                                                streamSource = streamSource.pipeThrough(interceptor);
+                                                // Capture refs in const variables for the async closure —
+                                                // loop variables (upstreamSpan, response) will change on next iteration,
+                                                // and TypeScript needs the narrowed type for tracer.
+                                                const capturedTracer = tracer;
+                                                const capturedUpstreamSpan = upstreamSpan;
+                                                const capturedResponse = response;
+                                                const capturedRequestBytes = finalBodyStr.length;
+                                                const capturedAccountLabel = account.label;
+                                                Promise.all([telemetry, clientCapture])
+                                                    .then(([data, clientBody]) => {
+                                                    capturedTracer.setUsage({
+                                                        inputTokens: data.usage.inputTokens,
+                                                        outputTokens: data.usage.outputTokens,
+                                                        cacheCreationTokens: data.usage.cacheCreationInputTokens,
+                                                        cacheReadTokens: data.usage.cacheReadInputTokens,
+                                                    });
+                                                    capturedTracer.logStreamEvents(data.events);
+                                                    // Extract rate limits from response headers
+                                                    const rateLimit5h = parseFloat(capturedResponse.headers.get("anthropic-ratelimit-unified-5h-utilization") ?? "");
+                                                    const rateLimit7d = parseFloat(capturedResponse.headers.get("anthropic-ratelimit-unified-7d-utilization") ?? "");
+                                                    const usageUpdate = {
+                                                        inputTokens: data.usage.inputTokens,
+                                                        outputTokens: data.usage.outputTokens,
+                                                        cacheCreationTokens: data.usage.cacheCreationInputTokens,
+                                                        cacheReadTokens: data.usage.cacheReadInputTokens,
+                                                    };
+                                                    if (!isNaN(rateLimit5h)) {
+                                                        usageUpdate.rateLimitAfter5h = rateLimit5h;
+                                                    }
+                                                    if (!isNaN(rateLimit7d)) {
+                                                        usageUpdate.rateLimitAfter7d = rateLimit7d;
+                                                    }
+                                                    if (!isNaN(rateLimit5h) || !isNaN(rateLimit7d)) {
+                                                        capturedTracer.setUsage(usageUpdate);
+                                                    }
+                                                    capturedTracer.logUpstreamResponseBody(data.rawText ?? "");
+                                                    capturedTracer.recordMetrics();
+                                                    capturedTracer.recordBodySizes(capturedRequestBytes, data.totalBytesReceived);
+                                                    capturedUpstreamSpan?.end();
+                                                    capturedTracer.end(200, Date.now() - requestStartTime);
+                                                    recordFinalSuccess(capturedAccountLabel, account.type);
+                                                    // Deferred JSONL log with token usage + traceId
+                                                    // (streaming: tokens only available after SSE stream finishes)
+                                                    logFinalRequest(200, capturedAccountLabel, account.type, undefined, undefined, {
+                                                        inputTokens: data.usage.inputTokens,
+                                                        outputTokens: data.usage.outputTokens,
+                                                        cacheCreationTokens: data.usage.cacheCreationInputTokens,
+                                                        cacheReadTokens: data.usage.cacheReadInputTokens,
+                                                    });
+                                                    logProxyBody({
+                                                        phase: "upstream_response",
+                                                        headers: respHeaders,
+                                                        body: data.rawText ?? "",
+                                                        bodySize: data.totalBytesReceived,
+                                                        contentType: respHeaders["content-type"] ?? "text/event-stream",
+                                                        account: capturedAccountLabel,
+                                                        accountType: account.type,
+                                                        attempt: attemptNumber,
+                                                        responseStatus: 200,
+                                                        durationMs: Date.now() - requestStartTime,
+                                                    });
+                                                    logProxyBody({
+                                                        phase: "client_response",
+                                                        headers: responseHeaders,
+                                                        body: clientBody.text,
+                                                        bodySize: clientBody.totalBytes,
+                                                        contentType: responseHeaders["content-type"] ?? "text/event-stream",
+                                                        account: capturedAccountLabel,
+                                                        accountType: account.type,
+                                                        attempt: attemptNumber,
+                                                        responseStatus: 200,
+                                                        durationMs: Date.now() - requestStartTime,
+                                                    });
+                                                })
+                                                    .catch((err) => {
+                                                    capturedTracer.setError("stream_error", err instanceof Error ? err.message : String(err));
+                                                    capturedUpstreamSpan?.end();
+                                                    capturedTracer.end(500, Date.now() - requestStartTime);
+                                                    recordFinalError(500, capturedAccountLabel, account.type);
+                                                    // Log the streaming error in JSONL
+                                                    logFinalRequest(500, capturedAccountLabel, account.type, "stream_error", err instanceof Error ? err.message : String(err));
+                                                });
+                                            }
+                                            catch {
+                                                // Interceptor attachment failed after stream setup; response handling continues.
+                                            }
+                                        }
+                                        else {
+                                            // No tracer — still intercept stream for JSONL token logging
+                                            upstreamSpan?.end();
+                                            try {
+                                                const { stream: noTracerInterceptor, telemetry: noTracerTelemetry } = createSSEInterceptor({
+                                                    captureRawText: true,
+                                                });
+                                                streamSource = streamSource.pipeThrough(noTracerInterceptor);
+                                                const capturedAccountLabel = account.label;
+                                                Promise.all([noTracerTelemetry, clientCapture])
+                                                    .then(([data, clientBody]) => {
+                                                    recordFinalSuccess(capturedAccountLabel, account.type);
+                                                    logFinalRequest(200, capturedAccountLabel, account.type, undefined, undefined, {
+                                                        inputTokens: data.usage.inputTokens,
+                                                        outputTokens: data.usage.outputTokens,
+                                                        cacheCreationTokens: data.usage.cacheCreationInputTokens,
+                                                        cacheReadTokens: data.usage.cacheReadInputTokens,
+                                                    });
+                                                    logProxyBody({
+                                                        phase: "upstream_response",
+                                                        headers: respHeaders,
+                                                        body: data.rawText ?? "",
+                                                        bodySize: data.totalBytesReceived,
+                                                        contentType: respHeaders["content-type"] ?? "text/event-stream",
+                                                        account: capturedAccountLabel,
+                                                        accountType: account.type,
+                                                        attempt: attemptNumber,
+                                                        responseStatus: 200,
+                                                        durationMs: Date.now() - requestStartTime,
+                                                    });
+                                                    logProxyBody({
+                                                        phase: "client_response",
+                                                        headers: responseHeaders,
+                                                        body: clientBody.text,
+                                                        bodySize: clientBody.totalBytes,
+                                                        contentType: responseHeaders["content-type"] ?? "text/event-stream",
+                                                        account: capturedAccountLabel,
+                                                        accountType: account.type,
+                                                        attempt: attemptNumber,
+                                                        responseStatus: 200,
+                                                        durationMs: Date.now() - requestStartTime,
+                                                    });
+                                                })
+                                                    .catch(() => {
+                                                    recordFinalSuccess(account.label, account.type);
+                                                    logFinalRequest(response.status, account.label, account.type);
+                                                });
+                                            }
+                                            catch {
+                                                // SSE interceptor creation failed — log without tokens
+                                                clientCapture
+                                                    .then((clientBody) => {
+                                                    logProxyBody({
+                                                        phase: "client_response",
+                                                        headers: responseHeaders,
+                                                        body: clientBody.text,
+                                                        bodySize: clientBody.totalBytes,
+                                                        contentType: responseHeaders["content-type"] ?? "text/event-stream",
+                                                        account: account.label,
+                                                        accountType: account.type,
+                                                        attempt: attemptNumber,
+                                                        responseStatus: 200,
+                                                        durationMs: Date.now() - requestStartTime,
+                                                    });
+                                                })
+                                                    .catch(() => {
+                                                    // Non-fatal
+                                                });
+                                                recordFinalSuccess(account.label, account.type);
+                                                logFinalRequest(response.status, account.label, account.type);
+                                            }
+                                        }
+                                        const clientStream = streamSource.pipeThrough(clientCaptureStream);
                                         // Forward rate limit headers from Anthropic.
                                         const responseHeaders = {
                                             "content-type": "text/event-stream",
@@ -1126,20 +2084,124 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                             "anthropic-ratelimit-tokens-limit",
                                         ]) {
                                             const val = response.headers.get(h);
-                                            // eslint-disable-next-line max-depth
                                             if (val) {
                                                 responseHeaders[h] = val;
                                             }
                                         }
-                                        return new Response(remainingStream, {
+                                        return new Response(clientStream, {
                                             status: response.status,
                                             headers: responseHeaders,
                                         });
                                     }
-                                    return buildClaudeError(502, "No response body from upstream");
+                                    upstreamSpan?.end();
+                                    tracer?.setError("stream_error", "No response body from upstream");
+                                    tracer?.end(502, Date.now() - requestStartTime);
+                                    recordFinalError(502, account.label, account.type);
+                                    logFinalRequest(502, account.label, account.type, "stream_error", "No response body from upstream");
+                                    const clientError = buildClaudeError(502, "No response body from upstream");
+                                    logProxyBody({
+                                        phase: "client_response",
+                                        headers: { "content-type": "application/json" },
+                                        body: JSON.stringify(clientError),
+                                        bodySize: Buffer.byteLength(JSON.stringify(clientError), "utf8"),
+                                        contentType: "application/json",
+                                        account: account.label,
+                                        accountType: account.type,
+                                        attempt: attemptNumber,
+                                        responseStatus: 502,
+                                        durationMs: Date.now() - requestStartTime,
+                                    });
+                                    return clientError;
                                 }
                                 // Non-streaming: return JSON directly.
-                                return response.json();
+                                // OTel: extract usage from response JSON before returning.
+                                const responseText = await response.text();
+                                tracer?.logUpstreamResponseBody(responseText);
+                                logProxyBody({
+                                    phase: "upstream_response",
+                                    headers: respHeaders,
+                                    body: responseText,
+                                    bodySize: Buffer.byteLength(responseText, "utf8"),
+                                    contentType: respHeaders["content-type"] ?? "application/json",
+                                    account: account.label,
+                                    accountType: account.type,
+                                    attempt: attemptNumber,
+                                    responseStatus: response.status,
+                                    durationMs: Date.now() - fetchStartMs,
+                                });
+                                logProxyBody({
+                                    phase: "client_response",
+                                    headers: respHeaders,
+                                    body: responseText,
+                                    bodySize: Buffer.byteLength(responseText, "utf8"),
+                                    contentType: respHeaders["content-type"] ?? "application/json",
+                                    account: account.label,
+                                    accountType: account.type,
+                                    attempt: attemptNumber,
+                                    responseStatus: response.status,
+                                    durationMs: Date.now() - requestStartTime,
+                                });
+                                const responseJson = JSON.parse(responseText);
+                                if (tracer && responseJson && typeof responseJson === "object") {
+                                    const usage = responseJson.usage;
+                                    if (usage) {
+                                        tracer.setUsage({
+                                            inputTokens: usage.input_tokens ?? 0,
+                                            outputTokens: usage.output_tokens ?? 0,
+                                            cacheCreationTokens: usage.cache_creation_input_tokens ?? 0,
+                                            cacheReadTokens: usage.cache_read_input_tokens ?? 0,
+                                        });
+                                        // Extract rate limits from response headers
+                                        const rateLimit5h = parseFloat(response.headers.get("anthropic-ratelimit-unified-5h-utilization") ?? "");
+                                        const rateLimit7d = parseFloat(response.headers.get("anthropic-ratelimit-unified-7d-utilization") ?? "");
+                                        if (!isNaN(rateLimit5h) || !isNaN(rateLimit7d)) {
+                                            const usageWithRates = {
+                                                inputTokens: usage.input_tokens ?? 0,
+                                                outputTokens: usage.output_tokens ?? 0,
+                                                cacheCreationTokens: usage.cache_creation_input_tokens ?? 0,
+                                                cacheReadTokens: usage.cache_read_input_tokens ?? 0,
+                                            };
+                                            if (!isNaN(rateLimit5h)) {
+                                                usageWithRates.rateLimitAfter5h = rateLimit5h;
+                                            }
+                                            if (!isNaN(rateLimit7d)) {
+                                                usageWithRates.rateLimitAfter7d = rateLimit7d;
+                                            }
+                                            tracer.setUsage(usageWithRates);
+                                        }
+                                    }
+                                    tracer.recordMetrics();
+                                    const responseJsonStr = JSON.stringify(responseJson);
+                                    tracer.recordBodySizes(finalBodyStr.length, responseJsonStr.length);
+                                    upstreamSpan?.end();
+                                    tracer.end(response.status, Date.now() - requestStartTime);
+                                    recordFinalSuccess(account.label, account.type);
+                                    logFinalRequest(response.status, account.label, account.type, undefined, undefined, {
+                                        inputTokens: usage?.input_tokens,
+                                        outputTokens: usage?.output_tokens,
+                                        cacheCreationTokens: usage?.cache_creation_input_tokens,
+                                        cacheReadTokens: usage?.cache_read_input_tokens,
+                                    });
+                                }
+                                else {
+                                    upstreamSpan?.end();
+                                    // No tracer — still extract usage from response JSON for JSONL logging
+                                    const noTracerUsage = responseJson && typeof responseJson === "object"
+                                        ? responseJson.usage
+                                        : undefined;
+                                    recordFinalSuccess(account.label, account.type);
+                                    logFinalRequest(response.status, account.label, account.type, undefined, undefined, {
+                                        inputTokens: noTracerUsage?.input_tokens,
+                                        outputTokens: noTracerUsage?.output_tokens,
+                                        cacheCreationTokens: noTracerUsage?.cache_creation_input_tokens,
+                                        cacheReadTokens: noTracerUsage?.cache_read_input_tokens,
+                                    });
+                                }
+                                return responseJson;
+                            }
+                            // OTel: end account selection span if all accounts were skipped
+                            if (attemptNumber === 0) {
+                                acctSelectionSpan?.end();
                             }
                             // All accounts exhausted — compute earliest recovery time.
                             const earliestRecovery = orderedAccounts.reduce((min, account) => {
@@ -1152,42 +2214,18 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                             // Try fallback chain (alternative providers)
                             const chain = modelRouter?.getFallbackChain() ?? [];
                             for (const fallback of chain) {
+                                const availability = await ProviderHealthChecker.checkFallbackProviderAvailability(fallback.provider, fallback.model);
+                                if (!availability.available) {
+                                    logger.debug(`[proxy] skipping fallback ${fallback.provider}/${fallback.model}: ${availability.reason ?? "provider unavailable"}`);
+                                    continue;
+                                }
                                 try {
                                     logger.always(`[proxy] fallback → ${fallback.provider}/${fallback.model}`);
                                     const parsed = parseClaudeRequest(body);
-                                    const opts = {
-                                        input: {
-                                            text: parsed.prompt,
-                                            ...(parsed.images.length > 0
-                                                ? { images: parsed.images }
-                                                : {}),
-                                        },
+                                    const opts = buildProxyFallbackOptions(parsed, {
                                         provider: fallback.provider,
                                         model: fallback.model,
-                                        systemPrompt: parsed.systemPrompt,
-                                        maxTokens: parsed.maxTokens,
-                                        ...(parsed.temperature !== undefined
-                                            ? { temperature: parsed.temperature }
-                                            : {}),
-                                        ...(parsed.topP !== undefined ? { topP: parsed.topP } : {}),
-                                        ...(parsed.topK !== undefined ? { topK: parsed.topK } : {}),
-                                        ...(parsed.stopSequences?.length
-                                            ? { stopSequences: parsed.stopSequences }
-                                            : {}),
-                                        tools: parsed.tools,
-                                        ...(parsed.toolChoice
-                                            ? { toolChoice: parsed.toolChoice }
-                                            : {}),
-                                        ...(parsed.thinkingConfig
-                                            ? { thinkingConfig: parsed.thinkingConfig }
-                                            : {}),
-                                        ...(parsed.conversationMessages?.length
-                                            ? {
-                                                conversationMessages: parsed.conversationMessages.slice(0, -1),
-                                            }
-                                            : {}),
-                                        maxSteps: 1,
-                                    };
+                                    });
                                     if (body.stream) {
                                         const streamResult = await ctx.neurolink.stream(opts);
                                         const serializer = new ClaudeStreamSerializer(body.model, 0);
@@ -1195,33 +2233,38 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                             for (const frame of serializer.start()) {
                                                 yield frame;
                                             }
+                                            let collectedText = "";
                                             for await (const chunk of streamResult.stream) {
                                                 const text = extractText(chunk);
                                                 if (text) {
+                                                    collectedText += text;
                                                     for (const frame of serializer.pushDelta(text)) {
                                                         yield frame;
                                                     }
                                                 }
                                             }
                                             // Emit tool_use blocks if model wants to call tools
-                                            if (streamResult.toolCalls?.length) {
-                                                for (const tc of streamResult.toolCalls) {
-                                                    const toolName = tc.toolName ??
-                                                        tc.name ??
-                                                        "unknown";
-                                                    const toolArgs = tc.args ??
-                                                        tc.parameters ??
-                                                        {};
-                                                    for (const frame of serializer.pushToolUse(generateToolUseId(), toolName, toolArgs)) {
+                                            const toolCalls = streamResult.toolCalls ?? [];
+                                            if (!hasTranslatedOutput(collectedText, toolCalls)) {
+                                                throw new Error(`Translated provider ${fallback.provider}/${fallback.model} returned no content or tool calls`);
+                                            }
+                                            if (toolCalls.length) {
+                                                for (const tc of toolCalls) {
+                                                    const toolName = tc.toolName ?? tc.name ?? "unknown";
+                                                    for (const frame of serializer.pushToolUse(generateToolUseId(), toolName, extractToolArgs(tc))) {
                                                         yield frame;
                                                     }
                                                 }
                                             }
                                             const reason = streamResult.finishReason ?? "end_turn";
-                                            for (const frame of serializer.finish(0, reason)) {
+                                            const resolvedUsage = extractUsageFromStreamResult(streamResult.usage);
+                                            for (const frame of serializer.finish(resolvedUsage.output, reason)) {
                                                 yield frame;
                                             }
                                         }
+                                        tracer?.end(200, Date.now() - requestStartTime);
+                                        recordFinalSuccess();
+                                        logFinalRequest(200, "", fallback.provider);
                                         return sseGenerator();
                                     }
                                     const streamResult = await ctx.neurolink.stream(opts);
@@ -1232,66 +2275,50 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                             collectedText += text;
                                         }
                                     }
+                                    if (!hasTranslatedOutput(collectedText, streamResult.toolCalls)) {
+                                        throw new Error(`Translated provider ${fallback.provider}/${fallback.model} returned no content or tool calls`);
+                                    }
                                     const internal = {
                                         content: collectedText,
                                         model: streamResult.model,
                                         finishReason: streamResult.finishReason ?? "end_turn",
                                         reasoning: undefined,
-                                        usage: streamResult.usage
-                                            ? {
-                                                input: streamResult.usage.input ??
-                                                    0,
-                                                output: streamResult.usage
-                                                    .output ?? 0,
-                                                total: streamResult.usage.total ??
-                                                    0,
-                                            }
-                                            : undefined,
+                                        usage: streamResult.usage ? extractUsageFromStreamResult(streamResult.usage) : undefined,
                                         toolCalls: streamResult.toolCalls,
                                     };
-                                    return serializeClaudeResponse(internal, body.model);
+                                    tracer?.end(200, Date.now() - requestStartTime);
+                                    recordFinalSuccess();
+                                    const clientResponse = serializeClaudeResponse(internal, body.model);
+                                    logFinalRequest(200, "", fallback.provider, undefined, undefined, {
+                                        inputTokens: internal.usage?.input,
+                                        outputTokens: internal.usage?.output,
+                                    });
+                                    const clientResponseText = JSON.stringify(clientResponse);
+                                    logProxyBody({
+                                        phase: "client_response",
+                                        headers: { "content-type": "application/json" },
+                                        body: clientResponseText,
+                                        bodySize: Buffer.byteLength(clientResponseText, "utf8"),
+                                        contentType: "application/json",
+                                        responseStatus: 200,
+                                        durationMs: Date.now() - requestStartTime,
+                                    });
+                                    return clientResponse;
                                 }
                                 catch (fallbackErr) {
                                     logger.debug(`[proxy] fallback ${fallback.provider}/${fallback.model} failed: ${fallbackErr instanceof Error ? fallbackErr.message : String(fallbackErr)}`);
-                                    continue;
                                 }
                             }
                             // If no explicit fallback chain is configured, try SDK auto-provider fallback.
-                            if (chain.length === 0) {
+                            // Skip auto-provider when all accounts are rate-limited — the client
+                            // (e.g. Claude Code) understands 429 + Retry-After and will retry on
+                            // its own. Silently routing to a different provider (e.g. OpenAI)
+                            // produces confusing errors like "insufficient_quota".
+                            if (chain.length === 0 && !sawRateLimit) {
                                 try {
                                     logger.always("[proxy] fallback → auto-provider");
                                     const parsed = parseClaudeRequest(body);
-                                    const opts = {
-                                        input: {
-                                            text: parsed.prompt,
-                                            ...(parsed.images.length > 0
-                                                ? { images: parsed.images }
-                                                : {}),
-                                        },
-                                        systemPrompt: parsed.systemPrompt,
-                                        maxTokens: parsed.maxTokens,
-                                        ...(parsed.temperature !== undefined
-                                            ? { temperature: parsed.temperature }
-                                            : {}),
-                                        ...(parsed.topP !== undefined ? { topP: parsed.topP } : {}),
-                                        ...(parsed.topK !== undefined ? { topK: parsed.topK } : {}),
-                                        ...(parsed.stopSequences?.length
-                                            ? { stopSequences: parsed.stopSequences }
-                                            : {}),
-                                        tools: parsed.tools,
-                                        ...(parsed.toolChoice
-                                            ? { toolChoice: parsed.toolChoice }
-                                            : {}),
-                                        ...(parsed.thinkingConfig
-                                            ? { thinkingConfig: parsed.thinkingConfig }
-                                            : {}),
-                                        ...(parsed.conversationMessages?.length
-                                            ? {
-                                                conversationMessages: parsed.conversationMessages.slice(0, -1),
-                                            }
-                                            : {}),
-                                        maxSteps: 1,
-                                    };
+                                    const opts = buildProxyFallbackOptions(parsed);
                                     if (body.stream) {
                                         const streamResult = await ctx.neurolink.stream(opts);
                                         const serializer = new ClaudeStreamSerializer(body.model, 0);
@@ -1299,33 +2326,38 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                             for (const frame of serializer.start()) {
                                                 yield frame;
                                             }
+                                            let collectedText = "";
                                             for await (const chunk of streamResult.stream) {
                                                 const text = extractText(chunk);
                                                 if (text) {
+                                                    collectedText += text;
                                                     for (const frame of serializer.pushDelta(text)) {
                                                         yield frame;
                                                     }
                                                 }
                                             }
                                             // Emit tool_use blocks if model wants to call tools
-                                            if (streamResult.toolCalls?.length) {
-                                                for (const tc of streamResult.toolCalls) {
-                                                    const toolName = tc.toolName ??
-                                                        tc.name ??
-                                                        "unknown";
-                                                    const toolArgs = tc.args ??
-                                                        tc.parameters ??
-                                                        {};
-                                                    for (const frame of serializer.pushToolUse(generateToolUseId(), toolName, toolArgs)) {
+                                            const toolCalls = streamResult.toolCalls ?? [];
+                                            if (!hasTranslatedOutput(collectedText, toolCalls)) {
+                                                throw new Error("Translated provider auto-provider returned no content or tool calls");
+                                            }
+                                            if (toolCalls.length) {
+                                                for (const tc of toolCalls) {
+                                                    const toolName = tc.toolName ?? tc.name ?? "unknown";
+                                                    for (const frame of serializer.pushToolUse(generateToolUseId(), toolName, extractToolArgs(tc))) {
                                                         yield frame;
                                                     }
                                                 }
                                             }
                                             const reason = streamResult.finishReason ?? "end_turn";
-                                            for (const frame of serializer.finish(0, reason)) {
+                                            const resolvedUsage = extractUsageFromStreamResult(streamResult.usage);
+                                            for (const frame of serializer.finish(resolvedUsage.output, reason)) {
                                                 yield frame;
                                             }
                                         }
+                                        tracer?.end(200, Date.now() - requestStartTime);
+                                        recordFinalSuccess();
+                                        logFinalRequest(200, "", "auto-provider");
                                         return sseGenerator();
                                     }
                                     const streamResult = await ctx.neurolink.stream(opts);
@@ -1336,48 +2368,102 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                             collectedText += text;
                                         }
                                     }
+                                    if (!hasTranslatedOutput(collectedText, streamResult.toolCalls)) {
+                                        throw new Error("Translated provider auto-provider returned no content or tool calls");
+                                    }
                                     const internal = {
                                         content: collectedText,
                                         model: streamResult.model,
                                         finishReason: streamResult.finishReason ?? "end_turn",
                                         reasoning: undefined,
-                                        usage: streamResult.usage
-                                            ? {
-                                                input: streamResult.usage.input ??
-                                                    0,
-                                                output: streamResult.usage
-                                                    .output ?? 0,
-                                                total: streamResult.usage.total ??
-                                                    0,
-                                            }
-                                            : undefined,
+                                        usage: streamResult.usage ? extractUsageFromStreamResult(streamResult.usage) : undefined,
                                         toolCalls: streamResult.toolCalls,
                                     };
-                                    return serializeClaudeResponse(internal, body.model);
+                                    tracer?.end(200, Date.now() - requestStartTime);
+                                    recordFinalSuccess();
+                                    const clientResponse = serializeClaudeResponse(internal, body.model);
+                                    logFinalRequest(200, "", "auto-provider", undefined, undefined, {
+                                        inputTokens: internal.usage?.input,
+                                        outputTokens: internal.usage?.output,
+                                    });
+                                    const clientResponseText = JSON.stringify(clientResponse);
+                                    logProxyBody({
+                                        phase: "client_response",
+                                        headers: { "content-type": "application/json" },
+                                        body: clientResponseText,
+                                        bodySize: Buffer.byteLength(clientResponseText, "utf8"),
+                                        contentType: "application/json",
+                                        responseStatus: 200,
+                                        durationMs: Date.now() - requestStartTime,
+                                    });
+                                    return clientResponse;
                                 }
                                 catch (fallbackErr) {
-                                    logger.debug(`[proxy] fallback auto-provider failed: ${fallbackErr instanceof Error
-                                        ? fallbackErr.message
-                                        : String(fallbackErr)}`);
+                                    logger.debug(`[proxy] fallback auto-provider failed: ${fallbackErr instanceof Error ? fallbackErr.message : String(fallbackErr)}`);
                                 }
                             }
                             if (authFailureMessage && !sawRateLimit) {
-                                return buildClaudeError(401, authFailureMessage);
+                                tracer?.setError("authentication_error", authFailureMessage);
+                                tracer?.end(401, Date.now() - requestStartTime);
+                                return buildLoggedClaudeError(401, authFailureMessage);
+                            }
+                            if (invalidRequestFailure) {
+                                tracer?.setError("invalid_request_error", summarizeErrorMessage(invalidRequestFailure.body));
+                                tracer?.end(invalidRequestFailure.status, Date.now() - requestStartTime);
+                                recordFinalError(invalidRequestFailure.status);
+                                try {
+                                    const parsedError = JSON.parse(invalidRequestFailure.body);
+                                    logFinalRequest(invalidRequestFailure.status, "", "final", "invalid_request_error", summarizeErrorMessage(invalidRequestFailure.body));
+                                    logProxyBody({
+                                        phase: "client_response",
+                                        headers: {
+                                            "content-type": invalidRequestFailure.contentType ?? "application/json",
+                                        },
+                                        body: invalidRequestFailure.body,
+                                        bodySize: Buffer.byteLength(invalidRequestFailure.body, "utf8"),
+                                        contentType: invalidRequestFailure.contentType ?? "application/json",
+                                        responseStatus: invalidRequestFailure.status,
+                                        durationMs: Date.now() - requestStartTime,
+                                    });
+                                    return parsedError;
+                                }
+                                catch {
+                                    return buildLoggedClaudeError(invalidRequestFailure.status, summarizeErrorMessage(invalidRequestFailure.body), "invalid_request_error");
+                                }
                             }
                             if ((sawNetworkError || sawTransientFailure) && !sawRateLimit) {
-                                return buildClaudeError(502, `All Anthropic accounts failed due to transient upstream/network errors. Last error: ${lastError instanceof Error
-                                    ? lastError.message
-                                    : String(lastError ?? "unknown")}`);
+                                const msg = `All Anthropic accounts failed due to transient upstream/network errors. Last error: ${lastError instanceof Error ? lastError.message : String(lastError ?? "unknown")}`;
+                                tracer?.setError("transient_error", msg.slice(0, 500));
+                                tracer?.end(502, Date.now() - requestStartTime);
+                                return buildLoggedClaudeError(502, msg);
                             }
                             if (!sawRateLimit) {
-                                return buildClaudeError(502, `All Anthropic accounts failed. Last error: ${lastError instanceof Error
-                                    ? lastError.message
-                                    : String(lastError ?? "unknown")}`);
+                                const msg = `All Anthropic accounts failed. Last error: ${lastError instanceof Error ? lastError.message : String(lastError ?? "unknown")}`;
+                                tracer?.setError("all_accounts_failed", msg.slice(0, 500));
+                                tracer?.end(502, Date.now() - requestStartTime);
+                                return buildLoggedClaudeError(502, msg);
                             }
                             // All accounts AND all fallbacks exhausted — return 429 with Retry-After
                             logger.always(`[proxy] all accounts rate-limited, retry in ${retryAfterSec}s`);
                             const errorBody = buildClaudeError(429, `All accounts rate-limited. Earliest recovery in ${retryAfterSec}s.`, "overloaded_error");
-                            return new Response(JSON.stringify(errorBody), {
+                            tracer?.setError("rate_limit_error", `All accounts rate-limited. Retry in ${retryAfterSec}s.`);
+                            tracer?.end(429, Date.now() - requestStartTime);
+                            recordFinalError(429);
+                            logFinalRequest(429, "", "final", "rate_limit_error", `All accounts rate-limited. Retry in ${retryAfterSec}s.`);
+                            const errorBodyText = JSON.stringify(errorBody);
+                            logProxyBody({
+                                phase: "client_response",
+                                headers: {
+                                    "content-type": "application/json",
+                                    "retry-after": String(retryAfterSec),
+                                },
+                                body: errorBodyText,
+                                bodySize: Buffer.byteLength(errorBodyText, "utf8"),
+                                contentType: "application/json",
+                                responseStatus: 429,
+                                durationMs: Date.now() - requestStartTime,
+                            });
+                            return new Response(errorBodyText, {
                                 status: 429,
                                 headers: {
                                     "content-type": "application/json",
@@ -1387,40 +2473,14 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                         }
                         else {
                             // ─── TRANSLATION MODE (Claude → Other Provider) ───────
+                            tracer?.setMode("full");
                             // Parse into NeuroLink format, call generate/stream, serialize back
                             const parsed = parseClaudeRequest(body);
-                            const historyMessages = parsed.conversationMessages.slice(0, -1);
-                            const options = {
-                                input: {
-                                    text: parsed.prompt,
-                                    ...(parsed.images.length > 0
-                                        ? { images: parsed.images }
-                                        : {}),
-                                },
+                            const attempts = buildProxyTranslationAttempts({
                                 provider: route.provider,
                                 model: route.model,
-                                systemPrompt: parsed.systemPrompt,
-                                maxTokens: parsed.maxTokens,
-                                ...(parsed.temperature !== undefined
-                                    ? { temperature: parsed.temperature }
-                                    : {}),
-                                ...(parsed.topP !== undefined ? { topP: parsed.topP } : {}),
-                                ...(parsed.topK !== undefined ? { topK: parsed.topK } : {}),
-                                ...(parsed.stopSequences?.length
-                                    ? { stopSequences: parsed.stopSequences }
-                                    : {}),
-                                ...(parsed.thinkingConfig
-                                    ? { thinkingConfig: parsed.thinkingConfig }
-                                    : {}),
-                                tools: parsed.tools,
-                                ...(parsed.toolChoice ? { toolChoice: parsed.toolChoice } : {}),
-                                maxSteps: 1,
-                                ...(historyMessages.length > 0
-                                    ? { conversationMessages: historyMessages }
-                                    : {}),
-                            };
+                            }, modelRouter);
                             if (body.stream) {
-                                const streamResult = await ctx.neurolink.stream(options);
                                 const serializer = new ClaudeStreamSerializer(body.model, 0);
                                 const KEEPALIVE_INTERVAL_MS = 15_000; // 15 seconds
                                 // Return a ReadableStream that emits SSE keep-alive comments
@@ -1429,6 +2489,9 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                 const encoder = new TextEncoder();
                                 let translationKeepAliveTimer;
                                 let translationCancelled = false;
+                                let translationSucceeded = false;
+                                let translatedModel;
+                                let finalStreamError = "No translation providers succeeded";
                                 // Hold a reference to the upstream async iterator so
                                 // we can abort it when the client disconnects.
                                 let upstreamIterator;
@@ -1448,59 +2511,85 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                             }
                                         }, KEEPALIVE_INTERVAL_MS);
                                         try {
-                                            const iterable = streamResult.stream;
-                                            upstreamIterator = iterable[Symbol.asyncIterator]();
-                                            // Manually drive the async iterator so we can cancel it
-                                            while (true) {
-                                                if (translationCancelled) {
-                                                    break;
+                                            for (let attemptIndex = 0; attemptIndex < attempts.length; attemptIndex++) {
+                                                const attempt = attempts[attemptIndex];
+                                                if (attemptIndex > 0) {
+                                                    logger.always(`[proxy] fallback → ${attempt.label}`);
                                                 }
-                                                const { value: chunk, done } = await upstreamIterator.next();
-                                                if (done) {
-                                                    break;
-                                                }
-                                                if (translationCancelled) {
-                                                    break;
-                                                }
-                                                const text = extractText(chunk);
-                                                if (text) {
-                                                    for (const frame of serializer.pushDelta(text)) {
-                                                        controller.enqueue(encoder.encode(frame));
+                                                let collectedText = "";
+                                                try {
+                                                    const options = buildProxyFallbackOptions(parsed, attempt.provider
+                                                        ? {
+                                                            provider: attempt.provider,
+                                                            model: attempt.model,
+                                                        }
+                                                        : {});
+                                                    const streamResult = await ctx.neurolink.stream(options);
+                                                    const iterable = streamResult.stream;
+                                                    upstreamIterator = iterable[Symbol.asyncIterator]();
+                                                    while (true) {
+                                                        if (translationCancelled) {
+                                                            break;
+                                                        }
+                                                        const { value: chunk, done } = await upstreamIterator.next();
+                                                        if (done) {
+                                                            break;
+                                                        }
+                                                        if (translationCancelled) {
+                                                            break;
+                                                        }
+                                                        const text = extractText(chunk);
+                                                        if (text) {
+                                                            collectedText += text;
+                                                            for (const frame of serializer.pushDelta(text)) {
+                                                                controller.enqueue(encoder.encode(frame));
+                                                            }
+                                                        }
+                                                    }
+                                                    const toolCalls = streamResult.toolCalls ?? [];
+                                                    if (!hasTranslatedOutput(collectedText, toolCalls)) {
+                                                        finalStreamError = `Translated provider ${attempt.label} returned no content or tool calls`;
+                                                        logger.debug(`[proxy] translation attempt ${attempt.label} returned no content or tool calls`);
+                                                        continue;
                                                     }
+                                                    if (!translationCancelled && toolCalls.length) {
+                                                        for (const tc of toolCalls) {
+                                                            const toolName = tc.toolName ?? tc.name ?? "unknown";
+                                                            for (const frame of serializer.pushToolUse(generateToolUseId(), toolName, extractToolArgs(tc))) {
+                                                                controller.enqueue(encoder.encode(frame));
+                                                            }
+                                                        }
+                                                    }
+                                                    if (!translationCancelled) {
+                                                        const reason = streamResult.finishReason ?? "end_turn";
+                                                        const resolvedUsage = extractUsageFromStreamResult(streamResult.usage);
+                                                        for (const frame of serializer.finish(resolvedUsage.output, reason)) {
+                                                            controller.enqueue(encoder.encode(frame));
+                                                        }
+                                                    }
+                                                    translatedModel = streamResult.model;
+                                                    translationSucceeded = true;
+                                                    return;
                                                 }
-                                            }
-                                            // Emit tool_use blocks if model wants to call tools
-                                            if (!translationCancelled &&
-                                                streamResult.toolCalls?.length) {
-                                                for (const tc of streamResult.toolCalls) {
-                                                    const toolName = tc.toolName ??
-                                                        tc.name ??
-                                                        "unknown";
-                                                    const toolArgs = tc.args ??
-                                                        tc.parameters ??
-                                                        {};
-                                                    for (const frame of serializer.pushToolUse(generateToolUseId(), toolName, toolArgs)) {
-                                                        controller.enqueue(encoder.encode(frame));
+                                                catch (streamErr) {
+                                                    if (translationCancelled) {
+                                                        return;
+                                                    }
+                                                    finalStreamError = streamErr instanceof Error ? streamErr.message : String(streamErr);
+                                                    if (collectedText.trim().length > 0) {
+                                                        logger.always(`[proxy] mid-stream error (translation mode): ${finalStreamError}`);
+                                                        const errorEvent = `event: error\ndata: ${JSON.stringify({ type: "error", error: { type: "api_error", message: `Upstream stream interrupted: ${finalStreamError}` } })}\n\n`;
+                                                        controller.enqueue(encoder.encode(errorEvent));
+                                                        return;
                                                     }
+                                                    logger.debug(`[proxy] translation attempt ${attempt.label} failed: ${finalStreamError}`);
                                                 }
                                             }
                                             if (!translationCancelled) {
-                                                const reason = streamResult.finishReason ?? "end_turn";
-                                                for (const frame of serializer.finish(0, reason)) {
-                                                    controller.enqueue(encoder.encode(frame));
-                                                }
-                                            }
-                                        }
-                                        catch (streamErr) {
-                                            if (translationCancelled) {
-                                                return;
+                                                logger.always(`[proxy] mid-stream error (translation mode): ${finalStreamError}`);
+                                                const errorEvent = `event: error\ndata: ${JSON.stringify({ type: "error", error: { type: "api_error", message: `Upstream stream interrupted: ${finalStreamError}` } })}\n\n`;
+                                                controller.enqueue(encoder.encode(errorEvent));
                                             }
-                                            const errMsg = streamErr instanceof Error
-                                                ? streamErr.message
-                                                : String(streamErr);
-                                            logger.always(`[proxy] mid-stream error (translation mode): ${errMsg}`);
-                                            const errorEvent = `event: error\ndata: ${JSON.stringify({ type: "error", error: { type: "api_error", message: `Upstream stream interrupted: ${errMsg}` } })}\n\n`;
-                                            controller.enqueue(encoder.encode(errorEvent));
                                         }
                                         finally {
                                             if (translationKeepAliveTimer) {
@@ -1509,6 +2598,14 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                             if (!translationCancelled) {
                                                 controller.close();
                                             }
+                                            // OTel: record model substitution if proxy routed to a different model
+                                            if (tracer && translatedModel && translatedModel !== body.model) {
+                                                tracer.setModelSubstitution(body.model, translatedModel);
+                                            }
+                                            if (!translationSucceeded) {
+                                                tracer?.setError("generation_error", finalStreamError.slice(0, 500));
+                                            }
+                                            tracer?.end(200, Date.now() - requestStartTime);
                                         }
                                     },
                                     cancel() {
@@ -1533,34 +2630,72 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                                     },
                                 });
                             }
-                            const streamResult = await ctx.neurolink.stream(options);
-                            let collectedText = "";
-                            for await (const chunk of streamResult.stream) {
-                                const text = extractText(chunk);
-                                if (text) {
-                                    collectedText += text;
+                            let lastAttemptError = "No translation providers succeeded";
+                            for (let attemptIndex = 0; attemptIndex < attempts.length; attemptIndex++) {
+                                const attempt = attempts[attemptIndex];
+                                if (attemptIndex > 0) {
+                                    logger.always(`[proxy] fallback → ${attempt.label}`);
                                 }
-                            }
-                            const internal = {
-                                content: collectedText,
-                                model: streamResult.model,
-                                finishReason: streamResult.finishReason ?? "end_turn",
-                                reasoning: undefined,
-                                usage: streamResult.usage
-                                    ? {
-                                        input: streamResult.usage.input ?? 0,
-                                        output: streamResult.usage.output ?? 0,
-                                        total: streamResult.usage.total ?? 0,
+                                try {
+                                    const options = buildProxyFallbackOptions(parsed, attempt.provider
+                                        ? {
+                                            provider: attempt.provider,
+                                            model: attempt.model,
+                                        }
+                                        : {});
+                                    const streamResult = await ctx.neurolink.stream(options);
+                                    let collectedText = "";
+                                    for await (const chunk of streamResult.stream) {
+                                        const text = extractText(chunk);
+                                        if (text) {
+                                            collectedText += text;
+                                        }
                                     }
-                                    : undefined,
-                                toolCalls: streamResult.toolCalls,
-                            };
-                            return serializeClaudeResponse(internal, body.model);
+                                    if (!hasTranslatedOutput(collectedText, streamResult.toolCalls)) {
+                                        lastAttemptError = `Translated provider ${attempt.label} returned no content or tool calls`;
+                                        logger.debug(`[proxy] translation attempt ${attempt.label} returned no content or tool calls`);
+                                        continue;
+                                    }
+                                    const internal = {
+                                        content: collectedText,
+                                        model: streamResult.model,
+                                        finishReason: streamResult.finishReason ?? "end_turn",
+                                        reasoning: undefined,
+                                        usage: streamResult.usage ? extractUsageFromStreamResult(streamResult.usage) : undefined,
+                                        toolCalls: streamResult.toolCalls,
+                                    };
+                                    // OTel: record model substitution if proxy routed to a different model
+                                    if (tracer && streamResult.model && streamResult.model !== body.model) {
+                                        tracer.setModelSubstitution(body.model, streamResult.model);
+                                    }
+                                    tracer?.end(200, Date.now() - requestStartTime);
+                                    const clientResponse = serializeClaudeResponse(internal, body.model);
+                                    const clientResponseText = JSON.stringify(clientResponse);
+                                    logProxyBody({
+                                        phase: "client_response",
+                                        headers: { "content-type": "application/json" },
+                                        body: clientResponseText,
+                                        bodySize: Buffer.byteLength(clientResponseText, "utf8"),
+                                        contentType: "application/json",
+                                        responseStatus: 200,
+                                        durationMs: Date.now() - requestStartTime,
+                                    });
+                                    return clientResponse;
+                                }
+                                catch (attemptError) {
+                                    lastAttemptError = attemptError instanceof Error ? attemptError.message : String(attemptError);
+                                    logger.debug(`[proxy] translation attempt ${attempt.label} failed: ${lastAttemptError}`);
+                                }
+                            }
+                            throw new Error(lastAttemptError);
                         }
                     }
                     catch (error) {
-                        logger.error(`[claude-proxy] Generation error for ${body.model}: ${error instanceof Error ? error.message : String(error)}`);
-                        return buildClaudeError(502, `Generation failed: ${error instanceof Error ? error.message : "unknown error"}`);
+                        const errMsg = error instanceof Error ? error.message : String(error);
+                        logger.error(`[claude-proxy] Generation error for ${body.model}: ${errMsg}`);
+                        tracer?.setError("generation_error", errMsg.slice(0, 500));
+                        tracer?.end(502, Date.now() - requestStartTime);
+                        return buildLoggedClaudeError(502, `Generation failed: ${error instanceof Error ? error.message : "unknown error"}`);
                     }
                 },
                 description: "Claude-compatible messages endpoint routed through NeuroLink",
@@ -1606,9 +2741,7 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
                     }
                     // Simple estimation using character-to-token heuristic
                     const text = body.messages
-                        .map((m) => typeof m.content === "string"
-                        ? m.content
-                        : JSON.stringify(m.content))
+                        .map((m) => (typeof m.content === "string" ? m.content : JSON.stringify(m.content)))
                         .join(" ");
                     return { input_tokens: Math.ceil(text.length / 4) };
                 },
@@ -1621,6 +2754,26 @@ export function createClaudeProxyRoutes(modelRouter, basePath = "", accountStrat
 // ---------------------------------------------------------------------------
 // Helpers
 // ---------------------------------------------------------------------------
+/**
+ * Normalize a StreamResult.usage object into { input, output, total }.
+ * Field names differ across AI SDK versions and providers, so each side is
+ * read from the first alias that holds a non-zero number, tried in order:
+ * - AI SDK v6: inputTokens / outputTokens
+ * - AI SDK v4: promptTokens / completionTokens
+ * - NeuroLink internal: input / output
+ * A missing or non-object usage yields all zeros.
+ */
+function extractUsageFromStreamResult(usage) {
+    if (!usage || typeof usage !== "object") {
+        return { input: 0, output: 0, total: 0 };
+    }
+    // Non-numeric fields count as 0, so `||` falls through to the next alias.
+    const numeric = (value) => (typeof value === "number" ? value : 0);
+    const firstNonZero = (...keys) => keys.reduce((found, key) => found || numeric(usage[key]), 0);
+    const input = firstNonZero("inputTokens", "promptTokens", "input");
+    const output = firstNonZero("outputTokens", "completionTokens", "output");
+    return { input, output, total: input + output };
+}
 /**
  * Extract text content from a stream chunk (handles various chunk formats).
  */
@@ -1744,24 +2897,17 @@ function isRetryableNetworkError(error) {
         normalized.includes("fetch failed") ||
         normalized.includes("socket hang up"));
 }
-const TRANSIENT_HTTP_STATUSES = new Set([
-    408, 500, 502, 503, 504, 520, 521, 522, 523, 524, 525, 526, 529,
-]);
+const TRANSIENT_HTTP_STATUSES = new Set([408, 500, 502, 503, 504, 520, 521, 522, 523, 524, 525, 526, 529]); // HTTP statuses classed as transient; presumably the ones worth a retry/failover — confirm against callers
 /**
  * Parse a Claude error payload when available.
  */
 export function parseClaudeErrorBody(errBody) {
     try {
         const parsed = JSON.parse(errBody);
-        if (parsed &&
-            parsed.type === "error" &&
-            parsed.error &&
-            typeof parsed.error === "object") {
+        if (parsed && parsed.type === "error" && parsed.error && typeof parsed.error === "object") {
             return {
                 errorType: typeof parsed.error.type === "string" ? parsed.error.type : undefined,
-                message: typeof parsed.error.message === "string"
-                    ? parsed.error.message
-                    : undefined,
+                message: typeof parsed.error.message === "string" ? parsed.error.message : undefined,
             };
         }
     }
@@ -1778,8 +2924,91 @@ export function isInvalidRequestError(status, errBody) {
         return true;
     }
     const parsed = parseClaudeErrorBody(errBody);
-    return (parsed.errorType === "invalid_request_error" ||
-        errBody.includes("invalid_request_error"));
+    return parsed.errorType === "invalid_request_error" || errBody.includes("invalid_request_error");
+}
+/**
+ * Return a shallow copy of a Claude request in which every message whose
+ * content is a plain string carries it as a single text block instead.
+ * Messages with non-string content are passed through unchanged.
+ */
+function normalizeClaudeRequestForAnthropic(body) {
+    const toBlockForm = (message) => {
+        const { content } = message;
+        return typeof content === "string"
+            ? { ...message, content: [{ type: "text", text: content }] }
+            : message;
+    };
+    return { ...body, messages: body.messages.map(toBlockForm) };
+}
+/**
+ * Translate a parsed Claude-compatible request into generation options for one
+ * translated attempt. `overrides.provider` / `overrides.model` are included only
+ * when truthy, and optional request fields only when set. The last conversation
+ * message is left out of `conversationMessages`; the three trailing flags are always set.
+ */
+export function buildProxyFallbackOptions(parsed, overrides = {}) {
+    const history = parsed.conversationMessages.slice(0, -1);
+    const declaredTools = Object.keys(parsed.tools);
+    const toolChoice = parsed.toolChoiceName
+        ? { type: "tool", toolName: parsed.toolChoiceName }
+        : parsed.toolChoice;
+    const input = { text: parsed.prompt };
+    if (parsed.images.length > 0) {
+        input.images = parsed.images;
+    }
+    const options = { input };
+    const setWhen = (include, key, value) => {
+        if (include) {
+            options[key] = value;
+        }
+    };
+    setWhen(overrides.provider, "provider", overrides.provider);
+    setWhen(overrides.model, "model", overrides.model);
+    Object.assign(options, { systemPrompt: parsed.systemPrompt, maxTokens: parsed.maxTokens });
+    for (const key of ["temperature", "topP", "topK"]) {
+        setWhen(parsed[key] !== undefined, key, parsed[key]);
+    }
+    setWhen(parsed.stopSequences?.length, "stopSequences", parsed.stopSequences);
+    setWhen(parsed.thinkingConfig, "thinkingConfig", parsed.thinkingConfig);
+    // The client already declared its exact tool contract: expose only those tools (filtering out built-in ones), or none at all.
+    Object.assign(options, declaredTools.length > 0 ? { tools: parsed.tools, toolFilter: declaredTools } : { disableTools: true });
+    setWhen(toolChoice, "toolChoice", toolChoice);
+    setWhen(history.length > 0, "conversationMessages", history);
+    Object.assign(options, { disableInternalFallback: true, skipToolPromptInjection: true, maxSteps: 1 });
+    return options;
+}
+/**
+ * Build the ordered list of provider/model attempts for a translated request:
+ * the primary target first, then every entry of the router's fallback chain
+ * that does not repeat the primary's provider and model. When the chain is empty
+ * (or no router is given) a provider-less "auto-provider" attempt is appended.
+ */
+function buildProxyTranslationAttempts(primary, modelRouter) {
+    const { provider: primaryProvider, model: primaryModel } = primary;
+    const attempts = [
+        { provider: primaryProvider, model: primaryModel, label: `${primaryProvider}/${primaryModel ?? "unknown"}` },
+    ];
+    const fallbackChain = modelRouter?.getFallbackChain() ?? [];
+    for (const { provider, model } of fallbackChain) {
+        const repeatsPrimary = provider === primaryProvider && model === primaryModel;
+        if (!repeatsPrimary) {
+            attempts.push({ provider, model, label: `${provider}/${model}` });
+        }
+    }
+    // With no configured chain, finish with an attempt that names no provider or model.
+    if (fallbackChain.length === 0) {
+        attempts.push({ label: "auto-provider" });
+    }
+    return attempts;
+}
+function hasTranslatedOutput(collectedText, toolCalls) { // true for non-blank text or at least one tool call
+    return collectedText.trim() !== "" ? true : (toolCalls?.length ?? 0) > 0;
+}
+/** Return the tool call's argument payload: `args`, else `parameters`, else `input`, else {}. */
+function extractToolArgs(toolCall) {
+    const payload = toolCall.args ?? toolCall.parameters ?? toolCall.input;
+    // Nullish in all three places: hand back a fresh empty object.
+    return payload ?? {};
 }
 /**
  * Detect transient upstream failures that should trigger account/provider failover.