npm - openclaw-autoproxy - Versions diffs - 1.0.5 → 1.0.7 - Mend

openclaw-autoproxy 1.0.5 → 1.0.7

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (9)

package/README.md +1 -0
package/README.zh-CN.md +1 -0
package/dist/gateway/model-load-metrics.js +49 -33
package/dist/gateway/proxy.js +12 -5
package/dist/gateway/server-http.js +81 -8
package/package.json +1 -1
package/src/gateway/model-load-metrics.ts +83 -50
package/src/gateway/proxy.ts +14 -5
package/src/gateway/server-http.ts +100 -8

package/README.md CHANGED Viewed

@@ -61,6 +61,7 @@ routes:
 - Start: `openclaw-autoproxy start`
 - Dev (watch): `openclaw-autoproxy dev`
 - Help: `openclaw-autoproxy help`
+- Publish: `npm publish --registry=https://registry.npmjs.org --access public`
 Quick run (installed):

package/README.zh-CN.md CHANGED Viewed

@@ -59,6 +59,7 @@ routes:
 - 启动：`openclaw-autoproxy start`
 - 开发（热重载）：`openclaw-autoproxy dev`
 - 帮助：`openclaw-autoproxy help`
+- 发布：`npm publish --registry=https://registry.npmjs.org --access public`
 快速示例（安装并立即启动）：

package/dist/gateway/model-load-metrics.js CHANGED Viewed

@@ -1,14 +1,7 @@
 const DEFAULT_WINDOW_MS = 12 * 60 * 60 * 1000;
 const DEFAULT_MAX_SAMPLES_PER_MODEL = 5000;
+export const DEFAULT_MODEL_HEALTH_WINDOW_MS = DEFAULT_WINDOW_MS;
 const modelSamples = new Map();
-function quantileFromSorted(values, q) {
-    if (values.length === 0) {
-        return 0;
-    }
-    const clampedQ = Math.max(0, Math.min(1, q));
-    const index = Math.floor((values.length - 1) * clampedQ);
-    return values[index] ?? values[values.length - 1] ?? 0;
-}
 function roundMs(value) {
     return Math.round(value * 100) / 100;
 }
@@ -34,17 +27,19 @@ function pruneExpiredSamples(cutoffAt) {
         }
     }
 }
-export function recordModelLoadSample(model, loadMs) {
+export function recordModelRequestSample(model, params) {
     if (!model) {
         return;
     }
-    if (!Number.isFinite(loadMs) || loadMs <= 0) {
+    if (!Number.isFinite(params.responseMs) || params.responseMs < 0) {
         return;
     }
     const now = Date.now();
     const sample = {
         at: now,
-        loadMs,
+        ok: params.ok,
+        responseMs: params.responseMs,
+        statusCode: params.statusCode ?? null,
     };
     const existing = modelSamples.get(model) ?? [];
     existing.push(sample);
@@ -55,31 +50,37 @@ export function recordModelLoadSample(model, loadMs) {
     const cutoffAt = now - DEFAULT_WINDOW_MS;
     pruneExpiredSamples(cutoffAt);
 }
+export function recordModelLoadSample(model, loadMs) {
+    recordModelRequestSample(model, {
+        ok: true,
+        responseMs: loadMs,
+        statusCode: 200,
+    });
+}
 function summarizeModel(model, samples) {
     if (samples.length === 0) {
         return null;
     }
-    const loadValues = samples.map((sample) => sample.loadMs).sort((a, b) => a - b);
-    const total = loadValues.reduce((acc, value) => acc + value, 0);
-    const avgLoadMs = total / loadValues.length;
-    const minLoadMs = loadValues[0] ?? 0;
-    const maxLoadMs = loadValues[loadValues.length - 1] ?? 0;
-    const latestAt = samples[samples.length - 1]?.at ?? Date.now();
+    const accessCount = samples.length;
+    const successCount = samples.reduce((count, sample) => count + (sample.ok ? 1 : 0), 0);
+    const totalResponseMs = samples.reduce((total, sample) => total + sample.responseMs, 0);
+    const lastSample = samples[samples.length - 1] ?? null;
+    const avgResponseMs = totalResponseMs / accessCount;
+    const successRatePct = accessCount > 0 ? (successCount / accessCount) * 100 : 0;
     return {
         model,
-        sampleCount: samples.length,
-        avgLoadMs: roundMs(avgLoadMs),
-        p50LoadMs: roundMs(quantileFromSorted(loadValues, 0.5)),
-        p95LoadMs: roundMs(quantileFromSorted(loadValues, 0.95)),
-        minLoadMs: roundMs(minLoadMs),
-        maxLoadMs: roundMs(maxLoadMs),
-        lastSeenAt: new Date(latestAt).toISOString(),
+        accessCount,
+        avgResponseMs: roundMs(avgResponseMs),
+        lastResponseMs: roundMs(lastSample?.responseMs ?? 0),
+        lastSeenAt: new Date(lastSample?.at ?? Date.now()).toISOString(),
+        lastStatusCode: lastSample?.statusCode ?? null,
+        successCount,
+        successRatePct: roundMs(successRatePct),
     };
 }
-export function getModelLoadRankingHealth(windowMs = DEFAULT_WINDOW_MS) {
+export function getModelHealthWindow(windowMs = DEFAULT_WINDOW_MS) {
     const normalizedWindowMs = Number.isFinite(windowMs) && windowMs > 0 ? windowMs : DEFAULT_WINDOW_MS;
-    const now = Date.now();
-    const cutoffAt = now - normalizedWindowMs;
+    const cutoffAt = Date.now() - normalizedWindowMs;
     pruneExpiredSamples(cutoffAt);
     const summaries = [];
     for (const [model, samples] of modelSamples.entries()) {
@@ -96,19 +97,34 @@ export function getModelLoadRankingHealth(windowMs = DEFAULT_WINDOW_MS) {
         }
     }
     summaries.sort((a, b) => {
-        if (a.avgLoadMs !== b.avgLoadMs) {
-            return a.avgLoadMs - b.avgLoadMs;
+        const aIsHealthy = a.lastStatusCode === 200 ? 1 : 0;
+        const bIsHealthy = b.lastStatusCode === 200 ? 1 : 0;
+        if (aIsHealthy !== bIsHealthy) {
+            return bIsHealthy - aIsHealthy;
+        }
+        if (a.avgResponseMs !== b.avgResponseMs) {
+            return a.avgResponseMs - b.avgResponseMs;
         }
-        if (a.p95LoadMs !== b.p95LoadMs) {
-            return a.p95LoadMs - b.p95LoadMs;
+        if (a.accessCount !== b.accessCount) {
+            return b.accessCount - a.accessCount;
         }
-        return b.sampleCount - a.sampleCount;
+        if (a.successRatePct !== b.successRatePct) {
+            return b.successRatePct - a.successRatePct;
+        }
+        return a.model.localeCompare(b.model);
     });
     return {
         windowHours: roundMs(normalizedWindowMs / (60 * 60 * 1000)),
-        rankedModels: summaries.map((entry, index) => ({
+        models: summaries.map((entry, index) => ({
             rank: index + 1,
             ...entry,
         })),
     };
 }
+export function getModelLoadRankingHealth(windowMs = DEFAULT_WINDOW_MS) {
+    const health = getModelHealthWindow(windowMs);
+    return {
+        windowHours: health.windowHours,
+        rankedModels: health.models,
+    };
+}

package/dist/gateway/proxy.js CHANGED Viewed

@@ -2,7 +2,7 @@ import { PassThrough, Readable } from "node:stream";
 import { Agent } from "undici";
 import { createAnthropicMessagesEventStreamTransformer, maybeTransformAnthropicMessagesRequest, transformOpenAiChatCompletionToAnthropicMessage, transformUpstreamErrorToAnthropicError, } from "./anthropic-compat.js";
 import { config } from "./config.js";
-import { recordModelLoadSample } from "./model-load-metrics.js";
+import { recordModelRequestSample } from "./model-load-metrics.js";
 const HOP_BY_HOP_HEADERS = new Set([
     "connection",
     "keep-alive",
@@ -586,8 +586,8 @@ export async function proxyRequest(request, response) {
         }
         const requestBody = bodyBuffer ? new Uint8Array(bodyBuffer) : undefined;
         const headers = buildUpstreamHeaders(request.headers, bodyBuffer ? bodyBuffer.length : undefined, selectedRoute);
+        const attemptStartedAt = Date.now();
         try {
-            const attemptStartedAt = Date.now();
             const upstreamResponse = await fetchWithTimeoutAndClientSignal(upstreamUrl, {
                 method,
                 headers,
@@ -595,9 +595,11 @@ export async function proxyRequest(request, response) {
             }, config.timeoutMs, clientSignal);
             const headerLoadMs = Date.now() - attemptStartedAt;
             const modelForMetric = modelId ?? requestedModel;
-            if (upstreamResponse.ok) {
-                recordModelLoadSample(modelForMetric, headerLoadMs);
-            }
+            recordModelRequestSample(modelForMetric, {
+                ok: upstreamResponse.ok,
+                responseMs: headerLoadMs,
+                statusCode: upstreamResponse.status,
+            });
             const contentType = (upstreamResponse.headers.get("content-type") ?? "").toLowerCase();
             const isEventStream = contentType.includes("text/event-stream");
             const isJsonResponse = contentType.includes("application/json");
@@ -753,6 +755,11 @@ export async function proxyRequest(request, response) {
         }
         catch (error) {
             lastError = error;
+            recordModelRequestSample(modelId ?? requestedModel, {
+                ok: false,
+                responseMs: Date.now() - attemptStartedAt,
+                statusCode: null,
+            });
             if (attemptIndex < modelCandidates.length - 1) {
                 continue;
             }

package/dist/gateway/server-http.js CHANGED Viewed

@@ -1,6 +1,6 @@
 import { createServer } from "node:http";
 import { config } from "./config.js";
-import { getModelLoadRankingHealth } from "./model-load-metrics.js";
+import { DEFAULT_MODEL_HEALTH_WINDOW_MS, getModelHealthWindow, } from "./model-load-metrics.js";
 import { proxyRequest } from "./proxy.js";
 function sendJson(response, statusCode, payload) {
     if (response.writableEnded) {
@@ -12,15 +12,79 @@ function sendJson(response, statusCode, payload) {
     response.setHeader("content-length", Buffer.byteLength(body));
     response.end(body);
 }
-function resolvePathname(request) {
+function sendText(response, statusCode, body) {
+    if (response.writableEnded) {
+        return;
+    }
+    response.statusCode = statusCode;
+    response.setHeader("content-type", "text/plain; charset=utf-8");
+    response.setHeader("content-length", Buffer.byteLength(body));
+    response.end(body);
+}
+function resolveRequestUrl(request) {
     const rawUrl = request.url ?? "/";
     try {
-        return new URL(rawUrl, "http://localhost").pathname;
+        return new URL(rawUrl, "http://localhost");
     }
     catch {
-        return rawUrl.startsWith("/") ? rawUrl : `/${rawUrl}`;
+        const normalized = rawUrl.startsWith("/") ? rawUrl : `/${rawUrl}`;
+        return new URL(normalized, "http://localhost");
     }
 }
+function resolvePathname(request) {
+    return resolveRequestUrl(request).pathname;
+}
+function formatTableNumber(value) {
+    if (!Number.isFinite(value)) {
+        return "-";
+    }
+    if (Number.isInteger(value)) {
+        return String(value);
+    }
+    return value.toFixed(2).replace(/\.00$/, "").replace(/(\.\d)0$/, "$1");
+}
+function formatTableDurationMs(value) {
+    if (!Number.isFinite(value)) {
+        return "-";
+    }
+    return String(Math.round(value));
+}
+function padTableCell(value, width, align) {
+    return align === "right" ? value.padStart(width, " ") : value.padEnd(width, " ");
+}
+function buildModelHealthTable(windowHours, models) {
+    const columns = [
+        { header: "Model", align: "left", value: (row) => row.model },
+        {
+            header: "Code",
+            align: "right",
+            value: (row) => row.lastStatusCode === null ? "-" : String(row.lastStatusCode),
+        },
+        { header: "Avg(ms)", align: "right", value: (row) => formatTableDurationMs(row.avgResponseMs) },
+        { header: "Last(ms)", align: "right", value: (row) => formatTableDurationMs(row.lastResponseMs) },
+        { header: "Count", align: "right", value: (row) => String(row.accessCount) },
+        { header: "OK%", align: "right", value: (row) => `${formatTableNumber(row.successRatePct)}%` },
+    ];
+    const widths = columns.map((column) => {
+        const rowWidths = models.map((row) => column.value(row).length);
+        return Math.max(column.header.length, ...rowWidths, 1);
+    });
+    const header = columns
+        .map((column, index) => padTableCell(column.header, widths[index] ?? column.header.length, column.align))
+        .join(" | ");
+    const divider = widths.map((width) => "-".repeat(width)).join("-+-");
+    const rows = models.map((row) => columns
+        .map((column, index) => padTableCell(column.value(row), widths[index] ?? 0, column.align))
+        .join(" | "));
+    return [
+        `Gateway Health (last ${formatTableNumber(windowHours)}h)`,
+        `Status: ok`,
+        "",
+        header,
+        divider,
+        ...(rows.length > 0 ? rows : ["No model traffic recorded in the last 12 hours."]),
+    ].join("\n");
+}
 function isGatewayApiPath(pathname) {
     return (pathname === "/v1" ||
         pathname.startsWith("/v1/") ||
@@ -29,15 +93,24 @@ function isGatewayApiPath(pathname) {
 }
 async function handleRequest(request, response) {
     const method = (request.method ?? "GET").toUpperCase();
-    const pathname = resolvePathname(request);
+    const requestUrl = resolveRequestUrl(request);
+    const pathname = requestUrl.pathname;
     if ((method === "GET" || method === "HEAD") && pathname === "/health") {
-        const modelLoadHealth = getModelLoadRankingHealth(12 * 60 * 60 * 1000);
+        const modelHealth = getModelHealthWindow(DEFAULT_MODEL_HEALTH_WINDOW_MS);
+        const tableOutput = buildModelHealthTable(modelHealth.windowHours, modelHealth.models);
+        if (requestUrl.searchParams.get("format")?.toLowerCase() !== "json") {
+            sendText(response, 200, tableOutput);
+            return;
+        }
         sendJson(response, 200, {
             status: "ok",
             retryStatusCodes: Array.from(config.retryStatusCodes),
             enabledRouteCount: Object.keys(config.modelRouteMap).length,
-            modelLoadWindowHours: modelLoadHealth.windowHours,
-            modelLoadRanking: modelLoadHealth.rankedModels,
+            modelHealthWindowHours: modelHealth.windowHours,
+            modelHealth: modelHealth.models,
+            modelHealthTable: tableOutput,
+            modelLoadWindowHours: modelHealth.windowHours,
+            modelLoadRanking: modelHealth.models,
         });
         return;
     }

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "openclaw-autoproxy",
-  "version": "1.0.5",
+  "version": "1.0.7",
   "description": "Local model-switching proxy gateway with OpenAI-compatible APIs",
   "type": "module",
   "main": "dist/gateway/server.js",

package/src/gateway/model-load-metrics.ts CHANGED Viewed

@@ -1,39 +1,33 @@
 const DEFAULT_WINDOW_MS = 12 * 60 * 60 * 1000;
 const DEFAULT_MAX_SAMPLES_PER_MODEL = 5000;
-interface ModelLoadSample {
+export const DEFAULT_MODEL_HEALTH_WINDOW_MS = DEFAULT_WINDOW_MS;
+interface ModelRequestSample {
   at: number;
-  loadMs: number;
+  ok: boolean;
+  responseMs: number;
+  statusCode: number | null;
 }
-interface ModelLoadSummary {
+export interface ModelHealthSummary {
   model: string;
-  sampleCount: number;
-  avgLoadMs: number;
-  p50LoadMs: number;
-  p95LoadMs: number;
-  minLoadMs: number;
-  maxLoadMs: number;
+  accessCount: number;
+  avgResponseMs: number;
+  lastResponseMs: number;
   lastSeenAt: string;
+  lastStatusCode: number | null;
+  successCount: number;
+  successRatePct: number;
 }
-const modelSamples = new Map<string, ModelLoadSample[]>();
-function quantileFromSorted(values: number[], q: number): number {
-  if (values.length === 0) {
-    return 0;
-  }
-  const clampedQ = Math.max(0, Math.min(1, q));
-  const index = Math.floor((values.length - 1) * clampedQ);
-  return values[index] ?? values[values.length - 1] ?? 0;
-}
+const modelSamples = new Map<string, ModelRequestSample[]>();
 function roundMs(value: number): number {
   return Math.round(value * 100) / 100;
 }
-function pruneModelSamples(samples: ModelLoadSample[], cutoffAt: number): ModelLoadSample[] {
+function pruneModelSamples(samples: ModelRequestSample[], cutoffAt: number): ModelRequestSample[] {
   let startIndex = 0;
   while (startIndex < samples.length && samples[startIndex] && samples[startIndex].at < cutoffAt) {
@@ -62,19 +56,28 @@ function pruneExpiredSamples(cutoffAt: number): void {
   }
 }
-export function recordModelLoadSample(model: string | null, loadMs: number): void {
+export function recordModelRequestSample(
+  model: string | null,
+  params: {
+    ok: boolean;
+    responseMs: number;
+    statusCode?: number | null;
+  },
+): void {
   if (!model) {
     return;
   }
-  if (!Number.isFinite(loadMs) || loadMs <= 0) {
+  if (!Number.isFinite(params.responseMs) || params.responseMs < 0) {
     return;
   }
   const now = Date.now();
-  const sample: ModelLoadSample = {
+  const sample: ModelRequestSample = {
     at: now,
-    loadMs,
+    ok: params.ok,
+    responseMs: params.responseMs,
+    statusCode: params.statusCode ?? null,
   };
   const existing = modelSamples.get(model) ?? [];
@@ -90,41 +93,48 @@ export function recordModelLoadSample(model: string | null, loadMs: number): voi
   pruneExpiredSamples(cutoffAt);
 }
-function summarizeModel(model: string, samples: ModelLoadSample[]): ModelLoadSummary | null {
+export function recordModelLoadSample(model: string | null, loadMs: number): void {
+  recordModelRequestSample(model, {
+    ok: true,
+    responseMs: loadMs,
+    statusCode: 200,
+  });
+}
+function summarizeModel(model: string, samples: ModelRequestSample[]): ModelHealthSummary | null {
   if (samples.length === 0) {
     return null;
   }
-  const loadValues = samples.map((sample) => sample.loadMs).sort((a, b) => a - b);
-  const total = loadValues.reduce((acc, value) => acc + value, 0);
-  const avgLoadMs = total / loadValues.length;
-  const minLoadMs = loadValues[0] ?? 0;
-  const maxLoadMs = loadValues[loadValues.length - 1] ?? 0;
-  const latestAt = samples[samples.length - 1]?.at ?? Date.now();
+  const accessCount = samples.length;
+  const successCount = samples.reduce((count, sample) => count + (sample.ok ? 1 : 0), 0);
+  const totalResponseMs = samples.reduce((total, sample) => total + sample.responseMs, 0);
+  const lastSample = samples[samples.length - 1] ?? null;
+  const avgResponseMs = totalResponseMs / accessCount;
+  const successRatePct = accessCount > 0 ? (successCount / accessCount) * 100 : 0;
   return {
     model,
-    sampleCount: samples.length,
-    avgLoadMs: roundMs(avgLoadMs),
-    p50LoadMs: roundMs(quantileFromSorted(loadValues, 0.5)),
-    p95LoadMs: roundMs(quantileFromSorted(loadValues, 0.95)),
-    minLoadMs: roundMs(minLoadMs),
-    maxLoadMs: roundMs(maxLoadMs),
-    lastSeenAt: new Date(latestAt).toISOString(),
+    accessCount,
+    avgResponseMs: roundMs(avgResponseMs),
+    lastResponseMs: roundMs(lastSample?.responseMs ?? 0),
+    lastSeenAt: new Date(lastSample?.at ?? Date.now()).toISOString(),
+    lastStatusCode: lastSample?.statusCode ?? null,
+    successCount,
+    successRatePct: roundMs(successRatePct),
   };
 }
-export function getModelLoadRankingHealth(windowMs = DEFAULT_WINDOW_MS): {
+export function getModelHealthWindow(windowMs = DEFAULT_WINDOW_MS): {
   windowHours: number;
-  rankedModels: Array<ModelLoadSummary & { rank: number }>;
+  models: Array<ModelHealthSummary & { rank: number }>;
 } {
   const normalizedWindowMs = Number.isFinite(windowMs) && windowMs > 0 ? windowMs : DEFAULT_WINDOW_MS;
-  const now = Date.now();
-  const cutoffAt = now - normalizedWindowMs;
+  const cutoffAt = Date.now() - normalizedWindowMs;
   pruneExpiredSamples(cutoffAt);
-  const summaries: ModelLoadSummary[] = [];
+  const summaries: ModelHealthSummary[] = [];
   for (const [model, samples] of modelSamples.entries()) {
     const filtered = pruneModelSamples(samples, cutoffAt);
@@ -145,22 +155,45 @@ export function getModelLoadRankingHealth(windowMs = DEFAULT_WINDOW_MS): {
   }
   summaries.sort((a, b) => {
-    if (a.avgLoadMs !== b.avgLoadMs) {
-      return a.avgLoadMs - b.avgLoadMs;
+    const aIsHealthy = a.lastStatusCode === 200 ? 1 : 0;
+    const bIsHealthy = b.lastStatusCode === 200 ? 1 : 0;
+    if (aIsHealthy !== bIsHealthy) {
+      return bIsHealthy - aIsHealthy;
     }
-    if (a.p95LoadMs !== b.p95LoadMs) {
-      return a.p95LoadMs - b.p95LoadMs;
+    if (a.avgResponseMs !== b.avgResponseMs) {
+      return a.avgResponseMs - b.avgResponseMs;
     }
-    return b.sampleCount - a.sampleCount;
+    if (a.accessCount !== b.accessCount) {
+      return b.accessCount - a.accessCount;
+    }
+    if (a.successRatePct !== b.successRatePct) {
+      return b.successRatePct - a.successRatePct;
+    }
+    return a.model.localeCompare(b.model);
   });
   return {
     windowHours: roundMs(normalizedWindowMs / (60 * 60 * 1000)),
-    rankedModels: summaries.map((entry, index) => ({
+    models: summaries.map((entry, index) => ({
       rank: index + 1,
       ...entry,
     })),
   };
 }
+export function getModelLoadRankingHealth(windowMs = DEFAULT_WINDOW_MS): {
+  windowHours: number;
+  rankedModels: Array<ModelHealthSummary & { rank: number }>;
+} {
+  const health = getModelHealthWindow(windowMs);
+  return {
+    windowHours: health.windowHours,
+    rankedModels: health.models,
+  };
+}

package/src/gateway/proxy.ts CHANGED Viewed

@@ -8,7 +8,7 @@ import {
   transformUpstreamErrorToAnthropicError,
 } from "./anthropic-compat.js";
 import { config, type ModelRouteConfig } from "./config.js";
-import { recordModelLoadSample } from "./model-load-metrics.js";
+import { recordModelRequestSample } from "./model-load-metrics.js";
 const HOP_BY_HOP_HEADERS = new Set([
   "connection",
@@ -814,8 +814,9 @@ export async function proxyRequest(request: IncomingMessage, response: ServerRes
       selectedRoute,
     );
+    const attemptStartedAt = Date.now();
     try {
-      const attemptStartedAt = Date.now();
       const upstreamResponse = await fetchWithTimeoutAndClientSignal(
         upstreamUrl,
         {
@@ -829,9 +830,11 @@ export async function proxyRequest(request: IncomingMessage, response: ServerRes
       const headerLoadMs = Date.now() - attemptStartedAt;
       const modelForMetric = modelId ?? requestedModel;
-      if (upstreamResponse.ok) {
-        recordModelLoadSample(modelForMetric, headerLoadMs);
-      }
+      recordModelRequestSample(modelForMetric, {
+        ok: upstreamResponse.ok,
+        responseMs: headerLoadMs,
+        statusCode: upstreamResponse.status,
+      });
       const contentType = (upstreamResponse.headers.get("content-type") ?? "").toLowerCase();
       const isEventStream = contentType.includes("text/event-stream");
@@ -1029,6 +1032,12 @@ export async function proxyRequest(request: IncomingMessage, response: ServerRes
     } catch (error) {
       lastError = error;
+      recordModelRequestSample(modelId ?? requestedModel, {
+        ok: false,
+        responseMs: Date.now() - attemptStartedAt,
+        statusCode: null,
+      });
       if (attemptIndex < modelCandidates.length - 1) {
         continue;
       }

package/src/gateway/server-http.ts CHANGED Viewed

@@ -1,6 +1,10 @@
 import { createServer, type IncomingMessage, type Server, type ServerResponse } from "node:http";
 import { config } from "./config.js";
-import { getModelLoadRankingHealth } from "./model-load-metrics.js";
+import {
+  DEFAULT_MODEL_HEALTH_WINDOW_MS,
+  getModelHealthWindow,
+  type ModelHealthSummary,
+} from "./model-load-metrics.js";
 import { proxyRequest } from "./proxy.js";
 function sendJson(response: ServerResponse, statusCode: number, payload: unknown): void {
@@ -15,16 +19,94 @@ function sendJson(response: ServerResponse, statusCode: number, payload: unknown
   response.end(body);
 }
-function resolvePathname(request: IncomingMessage): string {
+function sendText(response: ServerResponse, statusCode: number, body: string): void {
+  if (response.writableEnded) {
+    return;
+  }
+  response.statusCode = statusCode;
+  response.setHeader("content-type", "text/plain; charset=utf-8");
+  response.setHeader("content-length", Buffer.byteLength(body));
+  response.end(body);
+}
+function resolveRequestUrl(request: IncomingMessage): URL {
   const rawUrl = request.url ?? "/";
   try {
-    return new URL(rawUrl, "http://localhost").pathname;
+    return new URL(rawUrl, "http://localhost");
   } catch {
-    return rawUrl.startsWith("/") ? rawUrl : `/${rawUrl}`;
+    const normalized = rawUrl.startsWith("/") ? rawUrl : `/${rawUrl}`;
+    return new URL(normalized, "http://localhost");
   }
 }
+function resolvePathname(request: IncomingMessage): string {
+  return resolveRequestUrl(request).pathname;
+}
+function formatTableNumber(value: number): string {
+  if (!Number.isFinite(value)) {
+    return "-";
+  }
+  if (Number.isInteger(value)) {
+    return String(value);
+  }
+  return value.toFixed(2).replace(/\.00$/, "").replace(/(\.\d)0$/, "$1");
+}
+function formatTableDurationMs(value: number): string {
+  if (!Number.isFinite(value)) {
+    return "-";
+  }
+  return String(Math.round(value));
+}
+function padTableCell(value: string, width: number, align: "left" | "right"): string {
+  return align === "right" ? value.padStart(width, " ") : value.padEnd(width, " ");
+}
+function buildModelHealthTable(windowHours: number, models: Array<ModelHealthSummary & { rank: number }>): string {
+  const columns = [
+    { header: "Model", align: "left" as const, value: (row: ModelHealthSummary & { rank: number }) => row.model },
+    {
+      header: "Code",
+      align: "right" as const,
+      value: (row: ModelHealthSummary & { rank: number }) =>
+        row.lastStatusCode === null ? "-" : String(row.lastStatusCode),
+    },
+    { header: "Avg(ms)", align: "right" as const, value: (row: ModelHealthSummary & { rank: number }) => formatTableDurationMs(row.avgResponseMs) },
+    { header: "Last(ms)", align: "right" as const, value: (row: ModelHealthSummary & { rank: number }) => formatTableDurationMs(row.lastResponseMs) },
+    { header: "Count", align: "right" as const, value: (row: ModelHealthSummary & { rank: number }) => String(row.accessCount) },
+    { header: "OK%", align: "right" as const, value: (row: ModelHealthSummary & { rank: number }) => `${formatTableNumber(row.successRatePct)}%` },
+  ];
+  const widths = columns.map((column) => {
+    const rowWidths = models.map((row) => column.value(row).length);
+    return Math.max(column.header.length, ...rowWidths, 1);
+  });
+  const header = columns
+    .map((column, index) => padTableCell(column.header, widths[index] ?? column.header.length, column.align))
+    .join(" | ");
+  const divider = widths.map((width) => "-".repeat(width)).join("-+-");
+  const rows = models.map((row) => columns
+    .map((column, index) => padTableCell(column.value(row), widths[index] ?? 0, column.align))
+    .join(" | "));
+  return [
+    `Gateway Health (last ${formatTableNumber(windowHours)}h)`,
+    `Status: ok`,
+    "",
+    header,
+    divider,
+    ...(rows.length > 0 ? rows : ["No model traffic recorded in the last 12 hours."]),
+  ].join("\n");
+}
 function isGatewayApiPath(pathname: string): boolean {
   return (
     pathname === "/v1" ||
@@ -36,17 +118,27 @@ function isGatewayApiPath(pathname: string): boolean {
 async function handleRequest(request: IncomingMessage, response: ServerResponse): Promise<void> {
   const method = (request.method ?? "GET").toUpperCase();
-  const pathname = resolvePathname(request);
+  const requestUrl = resolveRequestUrl(request);
+  const pathname = requestUrl.pathname;
   if ((method === "GET" || method === "HEAD") && pathname === "/health") {
-    const modelLoadHealth = getModelLoadRankingHealth(12 * 60 * 60 * 1000);
+    const modelHealth = getModelHealthWindow(DEFAULT_MODEL_HEALTH_WINDOW_MS);
+    const tableOutput = buildModelHealthTable(modelHealth.windowHours, modelHealth.models);
+    if (requestUrl.searchParams.get("format")?.toLowerCase() !== "json") {
+      sendText(response, 200, tableOutput);
+      return;
+    }
     sendJson(response, 200, {
       status: "ok",
       retryStatusCodes: Array.from(config.retryStatusCodes),
       enabledRouteCount: Object.keys(config.modelRouteMap).length,
-      modelLoadWindowHours: modelLoadHealth.windowHours,
-      modelLoadRanking: modelLoadHealth.rankedModels,
+      modelHealthWindowHours: modelHealth.windowHours,
+      modelHealth: modelHealth.models,
+      modelHealthTable: tableOutput,
+      modelLoadWindowHours: modelHealth.windowHours,
+      modelLoadRanking: modelHealth.models,
     });
     return;
   }