npm - llm-simple-router - Versions diffs - 0.1.0 → 0.2.0 - Mend

llm-simple-router 0.1.0 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (67)

package/README.md +12 -14
package/dist/admin/groups.js +25 -0
package/dist/admin/providers.d.ts +0 -1
package/dist/admin/providers.js +16 -13
package/dist/admin/proxy-enhancement.d.ts +7 -0
package/dist/admin/proxy-enhancement.js +39 -0
package/dist/admin/router-keys.d.ts +0 -1
package/dist/admin/router-keys.js +17 -8
package/dist/admin/routes.d.ts +0 -3
package/dist/admin/routes.js +9 -4
package/dist/admin/setup.d.ts +7 -0
package/dist/admin/setup.js +44 -0
package/dist/cli.d.ts +2 -0
package/dist/cli.js +4 -0
package/dist/config.d.ts +1 -4
package/dist/config.js +13 -13
package/dist/db/index.d.ts +5 -2
package/dist/db/index.js +3 -1
package/dist/db/logs.d.ts +5 -2
package/dist/db/logs.js +4 -4
package/dist/db/mappings.d.ts +16 -0
package/dist/db/mappings.js +72 -0
package/dist/db/migrations/014_create_settings.sql +4 -0
package/dist/db/migrations/015_add_original_model.sql +1 -0
package/dist/db/migrations/016_create_session_model_tables.sql +24 -0
package/dist/db/session-states.d.ts +40 -0
package/dist/db/session-states.js +37 -0
package/dist/db/settings.d.ts +4 -0
package/dist/db/settings.js +10 -0
package/dist/index.d.ts +1 -0
package/dist/index.js +53 -13
package/dist/middleware/admin-auth.d.ts +2 -2
package/dist/middleware/admin-auth.js +21 -8
package/dist/middleware/auth.js +46 -1
package/dist/proxy/anthropic.d.ts +0 -1
package/dist/proxy/anthropic.js +2 -2
package/dist/proxy/directive-parser.d.ts +7 -0
package/dist/proxy/directive-parser.js +70 -0
package/dist/proxy/enhancement-handler.d.ts +23 -0
package/dist/proxy/enhancement-handler.js +167 -0
package/dist/proxy/log-helpers.d.ts +41 -0
package/dist/proxy/log-helpers.js +35 -0
package/dist/proxy/mapping-resolver.js +39 -2
package/dist/proxy/model-state.d.ts +28 -0
package/dist/proxy/model-state.js +111 -0
package/dist/proxy/openai.d.ts +0 -1
package/dist/proxy/openai.js +4 -3
package/dist/proxy/proxy-core.d.ts +9 -47
package/dist/proxy/proxy-core.js +215 -344
package/dist/proxy/response-cleaner.d.ts +5 -0
package/dist/proxy/response-cleaner.js +60 -0
package/dist/proxy/strategy/failover.d.ts +1 -1
package/dist/proxy/strategy/failover.js +10 -2
package/dist/proxy/strategy/random.d.ts +1 -1
package/dist/proxy/strategy/random.js +8 -2
package/dist/proxy/strategy/round-robin.d.ts +2 -1
package/dist/proxy/strategy/round-robin.js +13 -2
package/dist/proxy/strategy/targets-rule.d.ts +7 -0
package/dist/proxy/strategy/targets-rule.js +14 -0
package/dist/proxy/strategy/types.d.ts +5 -1
package/dist/proxy/strategy/types.js +3 -0
package/dist/proxy/upstream-call.d.ts +43 -0
package/dist/proxy/upstream-call.js +208 -0
package/dist/utils/password.d.ts +2 -0
package/dist/utils/password.js +14 -0
package/package.json +6 -5
package/.env.example +0 -13

package/dist/proxy/proxy-core.js (changed)

@@ -1,18 +1,18 @@
 import { randomUUID } from "crypto";
-import { request as httpRequestFn } from "http";
-import { request as httpsRequestFn } from "https";
-import { PassThrough } from "stream";
 import { getProviderById, insertRequestLog, insertMetrics } from "../db/index.js";
 import { decrypt } from "../utils/crypto.js";
-import { SSEMetricsTransform } from "../metrics/sse-metrics-transform.js";
+import { getSetting } from "../db/settings.js";
 import { MetricsExtractor } from "../metrics/metrics-extractor.js";
+import { getMappingGroup } from "../db/index.js";
 import { resolveMapping } from "./mapping-resolver.js";
 import { retryableCall, buildRetryConfig } from "./retry.js";
+import { SSEMetricsTransform } from "../metrics/sse-metrics-transform.js";
+import { proxyNonStream as upstreamNonStream, proxyStream as upstreamStream, proxyGetRequest as upstreamGet, } from "./upstream-call.js";
+import { insertSuccessLog, insertRejectedLog } from "./log-helpers.js";
+import { applyEnhancement, buildModelInfoTag } from "./enhancement-handler.js";
 // ---------- Constants ----------
-export const UPSTREAM_SUCCESS = 200;
-const HTTPS_DEFAULT_PORT = 443;
-const HTTP_DEFAULT_PORT = 80;
-const UPSTREAM_BAD_GATEWAY = 502;
+const UPSTREAM_SUCCESS = 200;
+const FAILOVER_FAIL_THRESHOLD = 400;
 // ---------- Header utilities ----------
 export const SKIP_UPSTREAM = new Set([
     "host",
@@ -24,12 +24,6 @@ export const SKIP_UPSTREAM = new Set([
     "transfer-encoding",
     "upgrade",
 ]);
-export const SKIP_DOWNSTREAM = new Set([
-    "content-length",
-    "transfer-encoding",
-    "connection",
-    "keep-alive",
-]);
 export function selectHeaders(raw, skip) {
     const out = {};
     for (const [key, value] of Object.entries(raw)) {
@@ -39,9 +33,8 @@ export function selectHeaders(raw, skip) {
     }
     return out;
 }
-// 当前两个 provider 都使用 Bearer token（commit eaa4f7d 将 Anthropic 从 x-api-key 改为 Bearer）
+// 当前两个 provider 都使用 Bearer token
 // 如果未来需要支持其他鉴权方式，需要参数化 header 构造
-/** 构建发往上游的请求 headers：过滤客户端 headers + 注入后端 API key */
 export function buildUpstreamHeaders(clientHeaders, apiKey, payloadBytes) {
     const headers = selectHeaders(clientHeaders, SKIP_UPSTREAM);
     headers["Authorization"] = `Bearer ${apiKey}`;
@@ -51,358 +44,236 @@ export function buildUpstreamHeaders(clientHeaders, apiKey, payloadBytes) {
     }
     return headers;
 }
-// ---------- Request utilities ----------
-/** 根据 URL scheme 选择 http 或 https 模块 */
-export function createUpstreamRequest(url, options) {
-    return url.protocol === "https:" ? httpsRequestFn(options) : httpRequestFn(options);
-}
-/** 从 URL + headers 构造 Node.js http.request 所需的 options */
-export function buildRequestOptions(url, headers, method = "POST") {
-    return {
-        hostname: url.hostname,
-        port: Number(url.port) || (url.protocol === "https:" ? HTTPS_DEFAULT_PORT : HTTP_DEFAULT_PORT),
-        path: url.pathname,
-        method,
-        headers,
-    };
-}
-// ---------- Logging ----------
-/** 插入成功请求日志，供 openai/anthropic 插件共享 */
-export function insertSuccessLog(db, apiType, logId, model, provider, isStream, startTime, reqBody, clientReq, upstreamReq, status, respBody, upHdrs, cliHdrs, isRetry = false, originalRequestId = null, routerKeyId = null) {
-    insertRequestLog(db, {
-        id: logId, api_type: apiType, model, provider_id: provider.id,
-        status_code: status, latency_ms: Date.now() - startTime,
-        is_stream: isStream ? 1 : 0, error_message: null,
-        created_at: new Date().toISOString(), request_body: reqBody,
-        response_body: respBody, client_request: clientReq, upstream_request: upstreamReq,
-        upstream_response: JSON.stringify({ statusCode: status, headers: upHdrs, body: respBody }),
-        client_response: JSON.stringify({ statusCode: status, headers: cliHdrs, body: respBody }),
-        is_retry: isRetry ? 1 : 0, original_request_id: originalRequestId,
-        router_key_id: routerKeyId,
-    });
-}
-// ---------- Non-stream proxy ----------
-export function proxyNonStream(backend, apiKey, body, clientHeaders, upstreamPath) {
-    return new Promise((resolve, reject) => {
-        const url = new URL(`${backend.base_url}${upstreamPath}`);
-        const payload = JSON.stringify(body);
-        const upstreamHeaders = buildUpstreamHeaders(clientHeaders, apiKey, Buffer.byteLength(payload));
-        const options = buildRequestOptions(url, upstreamHeaders);
-        const req = createUpstreamRequest(url, options);
-        req.on("response", (res) => {
-            const chunks = [];
-            res.on("data", (chunk) => chunks.push(chunk));
-            res.on("end", () => {
-                resolve({
-                    statusCode: res.statusCode || UPSTREAM_BAD_GATEWAY,
-                    body: Buffer.concat(chunks).toString("utf-8"),
-                    headers: selectHeaders(res.headers, SKIP_DOWNSTREAM),
-                    sentHeaders: { ...upstreamHeaders },
-                    sentBody: payload,
-                });
-            });
-        });
-        req.on("error", (err) => reject(err));
-        req.write(payload);
-        req.end();
-    });
-}
-// ---------- Stream proxy (SSE) ----------
-export function proxyStream(backend, apiKey, body, clientHeaders, reply, timeoutMs, upstreamPath, metricsTransform) {
-    return new Promise((resolve, reject) => {
-        const url = new URL(`${backend.base_url}${upstreamPath}`);
-        const payload = JSON.stringify(body);
-        const upstreamHeaders = buildUpstreamHeaders(clientHeaders, apiKey, Buffer.byteLength(payload));
-        const options = buildRequestOptions(url, upstreamHeaders);
-        const upstreamReq = createUpstreamRequest(url, options);
-        upstreamReq.on("response", (upstreamRes) => {
-            const statusCode = upstreamRes.statusCode || UPSTREAM_BAD_GATEWAY;
-            if (statusCode !== UPSTREAM_SUCCESS) {
-                // 非200路径：仅返回错误信息，不操作 reply
-                const chunks = [];
-                upstreamRes.on("data", (chunk) => chunks.push(chunk));
-                upstreamRes.on("end", () => {
-                    const errorBody = Buffer.concat(chunks).toString("utf-8");
-                    resolve({
-                        statusCode,
-                        responseBody: errorBody,
-                        upstreamResponseHeaders: selectHeaders(upstreamRes.headers, SKIP_DOWNSTREAM),
-                        sentHeaders: upstreamHeaders,
-                    });
-                });
-                return;
-            }
-            const sseHeaders = selectHeaders(upstreamRes.headers, SKIP_DOWNSTREAM);
-            sseHeaders["Content-Type"] = "text/event-stream";
-            sseHeaders["Cache-Control"] = "no-cache";
-            sseHeaders["Connection"] = "keep-alive";
-            reply.raw.writeHead(statusCode, sseHeaders);
-            const passThrough = new PassThrough();
-            if (metricsTransform) {
-                // 管道: upstreamRes → metricsTransform → passThrough → reply.raw
-                metricsTransform.pipe(passThrough).pipe(reply.raw);
-            }
-            else {
-                passThrough.pipe(reply.raw);
-            }
-            // 管道入口：有 metricsTransform 时写入它，否则直接写 passThrough
-            const pipeEntry = metricsTransform ?? passThrough;
-            const captureChunks = [];
-            let idleTimer = null;
-            let resolved = false;
-            function cleanup() {
-                if (idleTimer)
-                    clearTimeout(idleTimer);
-                idleTimer = null;
-                if (!passThrough.destroyed)
-                    passThrough.destroy();
-                if (metricsTransform && !metricsTransform.destroyed)
-                    metricsTransform.destroy();
-                if (!upstreamRes.destroyed)
-                    upstreamRes.destroy();
-            }
-            /** 从 metricsTransform 中提取指标，供 resolve 时附带 */
-            function collectMetrics(isComplete) {
-                if (!metricsTransform)
-                    return undefined;
-                const result = metricsTransform.getExtractor().getMetrics();
-                if (!isComplete) {
-                    return { ...result, is_complete: 0 };
-                }
-                return result;
-            }
-            reply.raw.on("close", () => {
-                if (!resolved) {
-                    cleanup();
-                    resolve({ statusCode, responseBody: undefined, upstreamResponseHeaders: sseHeaders, sentHeaders: upstreamHeaders, metricsResult: collectMetrics(false) });
-                }
-            });
-            passThrough.on("error", () => {
-                cleanup();
-                if (!resolved) {
-                    resolved = true;
-                    resolve({ statusCode, responseBody: undefined, upstreamResponseHeaders: sseHeaders, sentHeaders: upstreamHeaders, metricsResult: collectMetrics(false) });
-                }
-            });
-            function resetIdleTimer() {
-                if (idleTimer)
-                    clearTimeout(idleTimer);
-                idleTimer = setTimeout(() => {
-                    cleanup();
-                    if (!resolved) {
-                        resolved = true;
-                        resolve({ statusCode, responseBody: undefined, upstreamResponseHeaders: sseHeaders, sentHeaders: upstreamHeaders, metricsResult: collectMetrics(false) });
-                    }
-                }, timeoutMs);
-            }
-            resetIdleTimer();
-            upstreamRes.on("data", (chunk) => {
-                if (resolved)
-                    return;
-                resetIdleTimer();
-                pipeEntry.write(chunk);
-                captureChunks.push(chunk);
-            });
-            upstreamRes.on("end", () => {
-                if (resolved)
-                    return;
-                resolved = true;
-                if (idleTimer)
-                    clearTimeout(idleTimer);
-                pipeEntry.end();
-                reply.raw.end();
-                resolve({
-                    statusCode,
-                    responseBody: Buffer.concat(captureChunks).toString("utf-8"),
-                    upstreamResponseHeaders: sseHeaders,
-                    sentHeaders: upstreamHeaders,
-                    metricsResult: collectMetrics(true),
-                });
-            });
-            upstreamRes.on("error", (err) => {
-                if (resolved)
-                    return;
-                resolved = true;
-                cleanup();
-                reject(err);
-            });
-        });
-        upstreamReq.on("error", (err) => reject(err));
-        upstreamReq.write(payload);
-        upstreamReq.end();
-    });
-}
-// ---------- GET proxy ----------
+// ---------- GET proxy (thin wrapper) ----------
 export function proxyGetRequest(backend, apiKey, clientHeaders, upstreamPath) {
-    return new Promise((resolve, reject) => {
-        const url = new URL(`${backend.base_url}${upstreamPath}`);
-        const headers = buildUpstreamHeaders(clientHeaders, apiKey);
-        const options = buildRequestOptions(url, headers, "GET");
-        const req = createUpstreamRequest(url, options);
-        req.on("response", (res) => {
-            const chunks = [];
-            res.on("data", (chunk) => chunks.push(chunk));
-            res.on("end", () => {
-                resolve({
-                    statusCode: res.statusCode || UPSTREAM_BAD_GATEWAY,
-                    body: Buffer.concat(chunks).toString("utf-8"),
-                    headers: selectHeaders(res.headers, SKIP_DOWNSTREAM),
-                });
-            });
-        });
-        req.on("error", (err) => reject(err));
-        req.end();
-    });
+    return upstreamGet(backend, apiKey, clientHeaders, upstreamPath, buildUpstreamHeaders);
 }
+// ---------- Shared proxy handler ----------
 const HTTP_BAD_GATEWAY = 502;
 /**
- * 共享 POST handler，参数化 apiType/errorFormat/upstreamPath 等差异，
- * 消除 openai.ts / anthropic.ts 中约 120 行重复代码。
+ * 共享 POST handler，参数化 apiType/errorFormat/upstreamPath 等差异。
+ * 当分组策略为 failover 时，在 while 循环中依次尝试不同 target，
+ * 直到成功（或 headers 已发送）才返回。
  */
 export async function handleProxyPost(request, reply, apiType, upstreamPath, errors, deps, options) {
-    const { db, encryptionKey, streamTimeoutMs, retryMaxAttempts, retryBaseDelayMs, matcher } = deps;
+    const { db, streamTimeoutMs, retryMaxAttempts, retryBaseDelayMs, matcher } = deps;
     request.raw.socket.on("error", (err) => request.log.debug({ err }, "client socket error"));
-    const startTime = Date.now();
-    const logId = randomUUID();
-    const routerKeyId = request.routerKey?.id ?? null;
-    const body = request.body;
-    const originalBody = JSON.parse(JSON.stringify(body));
-    const clientModel = body.model || "unknown";
-    const resolved = resolveMapping(db, clientModel, { now: new Date() });
-    if (!resolved) {
-        const e = errors.modelNotFound(clientModel);
-        return reply.status(e.statusCode).send(e.body);
+    const clientModel = request.body.model || "unknown";
+    // 代理增强：指令解析 + 模型替换 + 命令拦截
+    const sessionId = request.headers["x-claude-code-session-id"];
+    const { effectiveModel, originalModel, interceptResponse } = applyEnhancement(db, request, clientModel, sessionId);
+    // 命令拦截（如 select-model）：直接返回，不转发上游
+    if (interceptResponse) {
+        const logId = randomUUID();
+        const isStream = request.body.stream === true;
+        const interceptRespBody = JSON.stringify(interceptResponse.body);
+        insertRequestLog(db, {
+            id: logId, api_type: apiType, model: clientModel, provider_id: "router",
+            status_code: interceptResponse.statusCode, latency_ms: 0,
+            is_stream: isStream ? 1 : 0, error_message: null,
+            created_at: new Date().toISOString(),
+            request_body: JSON.stringify(request.body),
+            response_body: interceptRespBody,
+            client_request: JSON.stringify({ headers: request.headers, body: request.body }),
+            upstream_request: interceptResponse.meta ? JSON.stringify(interceptResponse.meta) : null,
+            client_response: JSON.stringify({ statusCode: interceptResponse.statusCode, body: interceptRespBody }),
+            is_retry: 0, original_request_id: null,
+            router_key_id: request.routerKey?.id ?? null, original_model: null,
+        });
+        return reply.status(interceptResponse.statusCode).send(interceptResponse.body);
     }
-    // 白名单校验
-    const allowedModels = request.routerKey?.allowed_models;
-    if (allowedModels) {
-        try {
-            const models = JSON.parse(allowedModels);
-            if (models.length > 0 && !models.includes(resolved.backend_model)) {
-                const e = errors.modelNotAllowed(resolved.backend_model);
-                return reply.status(e.statusCode).send(e.body);
+    // 查询分组策略（只查一次）
+    const group = getMappingGroup(db, effectiveModel);
+    const isFailover = group?.strategy === "failover";
+    const excludeTargets = [];
+    while (true) {
+        const startTime = Date.now();
+        const logId = randomUUID();
+        const routerKeyId = request.routerKey?.id ?? null;
+        const body = request.body;
+        const originalBody = JSON.parse(JSON.stringify(body));
+        const isStream = body.stream === true;
+        const cliHdrs = request.headers;
+        const resolved = resolveMapping(db, effectiveModel, { now: new Date(), excludeTargets });
+        if (!resolved) {
+            if (isFailover && excludeTargets.length > 0) {
+                return reply;
             }
+            const e = errors.modelNotFound(effectiveModel);
+            insertRejectedLog({ db, logId, apiType, model: effectiveModel, statusCode: e.statusCode,
+                errorMessage: `No mapping found for model '${effectiveModel}'`, startTime, isStream,
+                routerKeyId, originalBody, clientHeaders: cliHdrs, originalModel });
+            return reply.status(e.statusCode).send(e.body);
         }
-        catch {
-            request.log.warn("Invalid allowed_models JSON, allowing all models");
+        // 白名单校验
+        if (excludeTargets.length === 0) {
+            const allowedModels = request.routerKey?.allowed_models;
+            if (allowedModels) {
+                try {
+                    const models = JSON.parse(allowedModels).filter((m) => m.trim() !== "");
+                    if (models.length > 0 && !models.includes(resolved.backend_model)) {
+                        const e = errors.modelNotAllowed(resolved.backend_model);
+                        insertRejectedLog({ db, logId, apiType, model: effectiveModel, statusCode: e.statusCode,
+                            errorMessage: `Model '${resolved.backend_model}' not allowed for this API key`,
+                            startTime, isStream, routerKeyId, originalBody, clientHeaders: cliHdrs,
+                            providerId: resolved.provider_id, originalModel });
+                        return reply.status(e.statusCode).send(e.body);
+                    }
+                }
+                catch {
+                    request.log.warn({ allowedModels: allowedModels?.slice(0, 80) }, "Invalid allowed_models JSON, allowing all models");
+                } // eslint-disable-line no-magic-numbers
+            }
         }
-    }
-    const provider = getProviderById(db, resolved.provider_id);
-    if (!provider || !provider.is_active) {
-        const e = errors.providerUnavailable();
-        return reply.status(e.statusCode).send(e.body);
-    }
-    if (provider.api_type !== apiType) {
-        const e = errors.providerTypeMismatch();
-        return reply.status(e.statusCode).send(e.body);
-    }
-    body.model = resolved.backend_model;
-    const apiKey = decrypt(provider.api_key, encryptionKey);
-    const isStream = body.stream === true;
-    // 允许调用方在发送代理请求前修改 body（如 openai 的 stream_options 注入）
-    options?.beforeSendProxy?.(body, isStream);
-    const reqBodyStr = JSON.stringify(body);
-    const cliHdrs = request.headers;
-    const clientReq = JSON.stringify({ headers: cliHdrs, body: originalBody });
-    const retryConfig = buildRetryConfig(retryMaxAttempts, retryBaseDelayMs, matcher);
-    const upstreamReqBase = JSON.stringify({ url: `${provider.base_url}${upstreamPath}`, headers: buildUpstreamHeaders(cliHdrs, apiKey, Buffer.byteLength(reqBodyStr)), body: reqBodyStr });
-    try {
-        const { result: r, attempts } = isStream
-            ? await retryableCall(() => {
-                const metricsTransform = new SSEMetricsTransform(apiType, startTime);
-                return proxyStream(provider, apiKey, body, cliHdrs, reply, streamTimeoutMs, upstreamPath, metricsTransform);
-            }, retryConfig, reply)
-            : await retryableCall(() => proxyNonStream(provider, apiKey, body, cliHdrs, upstreamPath), retryConfig, reply);
-        // 记录所有尝试的日志
-        let lastSuccessLogId = logId;
-        for (const attempt of attempts) {
-            const isOriginal = attempt.attemptIndex === 0;
-            const attemptLogId = isOriginal ? logId : randomUUID();
-            if (attempt.error) {
-                insertRequestLog(db, {
-                    id: attemptLogId, api_type: apiType, model: clientModel, provider_id: provider.id,
-                    status_code: HTTP_BAD_GATEWAY, latency_ms: attempt.latencyMs,
-                    is_stream: isStream ? 1 : 0, error_message: attempt.error,
-                    created_at: new Date().toISOString(), request_body: reqBodyStr,
-                    client_request: clientReq, upstream_request: upstreamReqBase,
-                    is_retry: isOriginal ? 0 : 1, original_request_id: isOriginal ? null : logId,
-                    router_key_id: routerKeyId,
-                });
+        const provider = getProviderById(db, resolved.provider_id);
+        if (!provider || !provider.is_active) {
+            const e = errors.providerUnavailable();
+            insertRejectedLog({ db, logId, apiType, model: effectiveModel, statusCode: e.statusCode,
+                errorMessage: `Provider '${resolved.provider_id}' unavailable or inactive`,
+                startTime, isStream, routerKeyId, originalBody, clientHeaders: cliHdrs,
+                providerId: resolved.provider_id, originalModel });
+            return reply.status(e.statusCode).send(e.body);
+        }
+        if (provider.api_type !== apiType) {
+            const e = errors.providerTypeMismatch();
+            insertRejectedLog({ db, logId, apiType, model: effectiveModel, statusCode: e.statusCode,
+                errorMessage: `Provider API type mismatch: expected '${apiType}', got '${provider.api_type}'`,
+                startTime, isStream, routerKeyId, originalBody, clientHeaders: cliHdrs,
+                providerId: resolved.provider_id, originalModel });
+            return reply.status(e.statusCode).send(e.body);
+        }
+        body.model = resolved.backend_model;
+        const apiKey = decrypt(provider.api_key, getSetting(db, "encryption_key"));
+        options?.beforeSendProxy?.(body, isStream);
+        const reqBodyStr = JSON.stringify(body);
+        const clientReq = JSON.stringify({ headers: cliHdrs, body: originalBody });
+        const retryConfig = buildRetryConfig(retryMaxAttempts, retryBaseDelayMs, matcher);
+        const upstreamReqBase = JSON.stringify({ url: `${provider.base_url}${upstreamPath}`, headers: buildUpstreamHeaders(cliHdrs, apiKey, Buffer.byteLength(reqBodyStr)), body: reqBodyStr });
+        try {
+            const { result: r, attempts } = isStream
+                ? await retryableCall(() => {
+                    const metricsTransform = new SSEMetricsTransform(apiType, startTime);
+                    return upstreamStream(provider, apiKey, body, cliHdrs, reply, streamTimeoutMs, upstreamPath, buildUpstreamHeaders, metricsTransform);
+                }, retryConfig, reply)
+                : await retryableCall(() => upstreamNonStream(provider, apiKey, body, cliHdrs, upstreamPath, buildUpstreamHeaders), retryConfig, reply);
+            // 记录所有尝试的日志
+            let lastSuccessLogId = logId;
+            for (const attempt of attempts) {
+                const isOriginal = attempt.attemptIndex === 0;
+                const attemptLogId = isOriginal ? logId : randomUUID();
+                if (attempt.error) {
+                    insertRequestLog(db, {
+                        id: attemptLogId, api_type: apiType, model: effectiveModel, provider_id: provider.id,
+                        status_code: HTTP_BAD_GATEWAY, latency_ms: attempt.latencyMs,
+                        is_stream: isStream ? 1 : 0, error_message: attempt.error,
+                        created_at: new Date().toISOString(), request_body: reqBodyStr,
+                        client_request: clientReq, upstream_request: upstreamReqBase,
+                        is_retry: isOriginal ? 0 : 1, original_request_id: isOriginal ? null : logId,
+                        router_key_id: routerKeyId, original_model: originalModel,
+                    });
+                }
+                else if (attempt.statusCode !== UPSTREAM_SUCCESS) {
+                    insertRequestLog(db, {
+                        id: attemptLogId, api_type: apiType, model: effectiveModel, provider_id: provider.id,
+                        status_code: attempt.statusCode, latency_ms: attempt.latencyMs,
+                        is_stream: isStream ? 1 : 0, error_message: null,
+                        created_at: new Date().toISOString(), request_body: reqBodyStr,
+                        response_body: attempt.responseBody, client_request: clientReq, upstream_request: upstreamReqBase,
+                        upstream_response: JSON.stringify({ statusCode: attempt.statusCode, body: attempt.responseBody }),
+                        client_response: JSON.stringify({ statusCode: attempt.statusCode, body: attempt.responseBody }),
+                        is_retry: isOriginal ? 0 : 1, original_request_id: isOriginal ? null : logId,
+                        router_key_id: routerKeyId, original_model: originalModel,
+                    });
+                }
+                else {
+                    const h = isStream
+                        ? (r.upstreamResponseHeaders ?? {})
+                        : (r.headers);
+                    insertSuccessLog(db, { apiType, model: effectiveModel, provider, isStream, startTime,
+                        reqBody: reqBodyStr, clientReq, upstreamReq: upstreamReqBase, id: attemptLogId,
+                        status: r.statusCode, respBody: attempt.responseBody, upHdrs: h, cliHdrs: h,
+                        isRetry: !isOriginal, originalRequestId: isOriginal ? null : logId,
+                        routerKeyId, originalModel });
+                    lastSuccessLogId = attemptLogId;
+                }
             }
-            else if (attempt.statusCode !== UPSTREAM_SUCCESS) {
-                insertRequestLog(db, {
-                    id: attemptLogId, api_type: apiType, model: clientModel, provider_id: provider.id,
-                    status_code: attempt.statusCode, latency_ms: attempt.latencyMs,
-                    is_stream: isStream ? 1 : 0, error_message: null,
-                    created_at: new Date().toISOString(), request_body: reqBodyStr,
-                    response_body: attempt.responseBody, client_request: clientReq, upstream_request: upstreamReqBase,
-                    upstream_response: JSON.stringify({ statusCode: attempt.statusCode, body: attempt.responseBody }),
-                    client_response: JSON.stringify({ statusCode: attempt.statusCode, body: attempt.responseBody }),
-                    is_retry: isOriginal ? 0 : 1, original_request_id: isOriginal ? null : logId,
-                    router_key_id: routerKeyId,
-                });
+            // --- Failover 检查 ---
+            if (isFailover && r.statusCode >= FAILOVER_FAIL_THRESHOLD && !reply.raw.headersSent) {
+                excludeTargets.push(resolved);
+                continue;
             }
-            else {
-                const h = isStream
-                    ? (r.upstreamResponseHeaders ?? {})
-                    : (r.headers);
-                insertSuccessLog(db, apiType, attemptLogId, clientModel, provider, isStream, startTime, reqBodyStr, clientReq, upstreamReqBase, r.statusCode, attempt.responseBody, h, h, !isOriginal, isOriginal ? null : logId, routerKeyId);
-                lastSuccessLogId = attemptLogId;
+            // 发送响应
+            if (isStream) {
+                if (r.statusCode !== UPSTREAM_SUCCESS) {
+                    for (const [k, v] of Object.entries(r.upstreamResponseHeaders ?? {}))
+                        reply.header(k, v);
+                    reply.status(r.statusCode).send(r.responseBody);
+                }
             }
-        }
-        // 将最终结果发送给客户端
-        if (isStream) {
-            if (r.statusCode !== UPSTREAM_SUCCESS) {
-                for (const [k, v] of Object.entries(r.upstreamResponseHeaders ?? {}))
+            else {
+                const pr = r;
+                // 非流式响应：模型替换时注入 router-response 标签
+                if (originalModel && pr.statusCode === UPSTREAM_SUCCESS) {
+                    try {
+                        const bodyObj = JSON.parse(pr.body);
+                        if (bodyObj.content?.[0]?.text) {
+                            bodyObj.content[0].text += `\n\n${buildModelInfoTag(effectiveModel)}`;
+                            pr.body = JSON.stringify(bodyObj);
+                        }
+                    }
+                    catch {
+                        request.log.debug("Failed to inject model-info tag into non-JSON response");
+                    }
+                }
+                for (const [k, v] of Object.entries(pr.headers))
                     reply.header(k, v);
-                reply.status(r.statusCode).send(r.responseBody);
+                return reply.status(pr.statusCode).send(pr.body);
             }
-        }
-        else {
-            const pr = r;
-            for (const [k, v] of Object.entries(pr.headers))
-                reply.header(k, v);
-            return reply.status(pr.statusCode).send(pr.body);
-        }
-        // 仅对最终成功请求采集 metrics
-        if (r.statusCode === UPSTREAM_SUCCESS) {
-            if (isStream) {
-                const streamResult = r;
-                if (streamResult.metricsResult) {
+            // metrics 采集
+            if (r.statusCode === UPSTREAM_SUCCESS) {
+                if (isStream) {
+                    const streamResult = r;
+                    if (streamResult.metricsResult) {
+                        try {
+                            insertMetrics(db, { ...streamResult.metricsResult, request_log_id: lastSuccessLogId, provider_id: provider.id, backend_model: resolved.backend_model, api_type: apiType });
+                        }
+                        catch (err) {
+                            request.log.error({ err }, "Failed to insert metrics");
+                        }
+                    }
+                }
+                else {
                     try {
-                        insertMetrics(db, { ...streamResult.metricsResult, request_log_id: lastSuccessLogId, provider_id: provider.id, backend_model: resolved.backend_model, api_type: apiType });
+                        const mr = MetricsExtractor.fromNonStreamResponse(apiType, r.body);
+                        if (mr)
+                            insertMetrics(db, { ...mr, request_log_id: lastSuccessLogId, provider_id: provider.id, backend_model: resolved.backend_model, api_type: apiType });
                     }
                     catch (err) {
                         request.log.error({ err }, "Failed to insert metrics");
                     }
                 }
             }
-            else {
-                try {
-                    const mr = MetricsExtractor.fromNonStreamResponse(apiType, r.body);
-                    if (mr)
-                        insertMetrics(db, { ...mr, request_log_id: lastSuccessLogId, provider_id: provider.id, backend_model: resolved.backend_model, api_type: apiType });
-                }
-                catch (err) {
-                    request.log.error({ err }, "Failed to insert metrics");
-                }
+            return reply;
+        }
+        catch (err) {
+            const errMsg = err instanceof Error ? err.message : String(err);
+            const sentH = buildUpstreamHeaders(cliHdrs, apiKey, Buffer.byteLength(reqBodyStr));
+            const upstreamReq = JSON.stringify({ url: `${provider.base_url}${upstreamPath}`, headers: sentH, body: reqBodyStr });
+            insertRequestLog(db, {
+                id: logId, api_type: apiType, model: effectiveModel, provider_id: provider.id,
+                status_code: HTTP_BAD_GATEWAY, latency_ms: Date.now() - startTime,
+                is_stream: isStream ? 1 : 0, error_message: errMsg || "Upstream connection failed",
+                created_at: new Date().toISOString(), request_body: reqBodyStr,
+                client_request: clientReq, upstream_request: upstreamReq,
+                router_key_id: routerKeyId, original_model: originalModel,
+            });
+            // --- Failover 检查（异常路径）---
+            if (isFailover && !reply.raw.headersSent) {
+                excludeTargets.push(resolved);
+                continue;
             }
+            const e = errors.upstreamConnectionFailed();
+            return reply.status(e.statusCode).send(e.body);
         }
-        return reply;
-    }
-    catch (err) {
-        const errMsg = err instanceof Error ? err.message : String(err);
-        const sentH = buildUpstreamHeaders(cliHdrs, apiKey, Buffer.byteLength(reqBodyStr));
-        const upstreamReq = JSON.stringify({ url: `${provider.base_url}${upstreamPath}`, headers: sentH, body: reqBodyStr });
-        insertRequestLog(db, {
-            id: logId, api_type: apiType, model: clientModel, provider_id: provider.id,
-            status_code: HTTP_BAD_GATEWAY, latency_ms: Date.now() - startTime,
-            is_stream: isStream ? 1 : 0, error_message: errMsg || "Upstream connection failed",
-            created_at: new Date().toISOString(), request_body: reqBodyStr,
-            client_request: clientReq, upstream_request: upstreamReq,
-            router_key_id: routerKeyId,
-        });
-        const e = errors.upstreamConnectionFailed();
-        return reply.status(e.statusCode).send(e.body);
     }
 }

package/dist/proxy/response-cleaner.d.ts ADDED Viewed

@@ -0,0 +1,5 @@
+/**
+ * Cleans router-related content (command messages and router-response tags) out of the historical messages.
+ * Only historical turns are cleaned; the last user message is skipped (the current turn is handled by directive-parser).
+ */
+export declare function cleanRouterResponses(body: Record<string, unknown>): Record<string, unknown>;