npm - gpteam - Versions diffs - 0.1.4 → 0.1.5 - Mend

gpteam 0.1.4 → 0.1.5

This diff shows the changes between two publicly available versions of a package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (5)

package/README.md CHANGED Viewed

@@ -8,7 +8,7 @@ npx gpteam
 The CLI asks for an API key, validates it with `/v1/models`, detects available models, benchmarks all production ingress endpoints with real API requests, then backs up old files and writes the selected client configuration. The next steps are blocked until the key validation succeeds. Ingress endpoints are benchmarked in parallel, while rounds for the same endpoint remain sequential to keep real API request pressure bounded. Failed benchmark rows show their error reason in the result table.
-Recommendation order is deterministic: success rate first, then a latency score using first SSE event, total completion time, and health-check time. Model prompts use "configurable context" wording because the value is written to the client-side Codex `model_context_window`; it must not be confused with a public marketing total-window label.
+Recommendation order is deterministic: success rate first, then an experience score. The score weighs first SSE event time, total completion time, p90 completion tail latency, and health-check time, so a node with one very slow probe is not recommended just because its median result looks good. Model prompts use "configurable context" wording because the value is written to the client-side Codex `model_context_window`; it must not be confused with a public marketing total-window label.
 Codex config writing follows the same safety pattern as cc-switch: keep top-level fields separate from provider tables, preserve unrelated sections such as MCP servers, and stop before writing if the generated TOML would contain duplicate keys.

package/lib/bench.js CHANGED Viewed

@@ -3,6 +3,16 @@ import https from 'node:https';
 import { performance } from 'node:perf_hooks';
 import { inspectSSEBody } from './sse.js';
+const MISSING_LATENCY_MS = 999999;
+const SCORE_WEIGHTS = {
+  firstEvent: 0.55,
+  total: 0.30,
+  health: 0.05,
+  tailFirstEventPenalty: 0.25,
+  tailTotalPenalty: 0.20,
+  failurePenalty: 4
+};
 export async function benchmarkNodes(nodes, options) {
   const rounds = options.rounds || 3;
   const runBenchmark = options.benchmarkNode || benchmarkNode;
@@ -30,18 +40,24 @@ export async function benchmarkNode(node, options) {
 export function summarizeNode(node, samples) {
   const successful = samples.filter((sample) => sample.ok);
   const streams = successful.map((sample) => sample.stream);
-  return {
+  const firstEvents = streams.map((item) => item.firstEventMs).filter(Number.isFinite);
+  const totals = streams.map((item) => item.totalMs).filter(Number.isFinite);
+  const summary = {
     node,
     samples,
     successRate: samples.length ? successful.length / samples.length : 0,
-    firstEventMs: median(streams.map((item) => item.firstEventMs).filter(Number.isFinite)),
-    totalMs: median(streams.map((item) => item.totalMs).filter(Number.isFinite)),
+    firstEventMs: median(firstEvents),
+    totalMs: median(totals),
+    tailFirstEventMs: percentile(firstEvents, 0.9),
+    tailTotalMs: percentile(totals, 0.9),
     dnsMs: median(streams.map((item) => item.dnsMs).filter(Number.isFinite)),
     tcpMs: median(streams.map((item) => item.tcpMs).filter(Number.isFinite)),
     tlsMs: median(streams.map((item) => item.tlsMs).filter(Number.isFinite)),
     healthMs: median(successful.map((sample) => sample.health.totalMs).filter(Number.isFinite)),
     error: samples.find((sample) => sample.error)?.error || ''
   };
+  summary.experienceScore = scoreResult(summary);
+  return summary;
 }
 export function formatMs(value) {
@@ -53,14 +69,29 @@ export function formatMs(value) {
 function compareResults(a, b) {
   const successDelta = b.successRate - a.successRate;
   if (successDelta !== 0) return successDelta;
-  return scoreLatency(a) - scoreLatency(b);
+  const scoreDelta = a.experienceScore - b.experienceScore;
+  if (scoreDelta !== 0) return scoreDelta;
+  return String(a.node.id || a.node.label).localeCompare(String(b.node.id || b.node.label));
+}
+function scoreResult(result) {
+  if (!result.successRate) return Number.POSITIVE_INFINITY;
+  const firstEventMs = finiteOrFallback(result.firstEventMs);
+  const totalMs = finiteOrFallback(result.totalMs);
+  const healthMs = finiteOrFallback(result.healthMs);
+  const tailFirstEventMs = finiteOrFallback(result.tailFirstEventMs, firstEventMs);
+  const tailTotalMs = finiteOrFallback(result.tailTotalMs, totalMs);
+  const typicalLatency = firstEventMs * SCORE_WEIGHTS.firstEvent
+    + totalMs * SCORE_WEIGHTS.total
+    + healthMs * SCORE_WEIGHTS.health;
+  const tailPenalty = Math.max(0, tailFirstEventMs - firstEventMs) * SCORE_WEIGHTS.tailFirstEventPenalty
+    + Math.max(0, tailTotalMs - totalMs) * SCORE_WEIGHTS.tailTotalPenalty;
+  const failurePenalty = 1 + Math.max(0, 1 - result.successRate) * SCORE_WEIGHTS.failurePenalty;
+  return (typicalLatency + tailPenalty) * failurePenalty;
 }
-function scoreLatency(result) {
-  const firstEventMs = Number.isFinite(result.firstEventMs) ? result.firstEventMs : 999999;
-  const totalMs = Number.isFinite(result.totalMs) ? result.totalMs : 999999;
-  const healthMs = Number.isFinite(result.healthMs) ? result.healthMs : 999999;
-  return firstEventMs * 0.6 + totalMs * 0.35 + healthMs * 0.05;
+function finiteOrFallback(value, fallback = MISSING_LATENCY_MS) {
+  return Number.isFinite(value) ? value : fallback;
 }
 async function measureHealth(url) {
@@ -168,3 +199,10 @@ function median(values) {
   const middle = Math.floor(sorted.length / 2);
   return sorted.length % 2 ? sorted[middle] : (sorted[middle - 1] + sorted[middle]) / 2;
 }
+function percentile(values, ratio) {
+  if (!values.length) return NaN;
+  const sorted = [...values].sort((a, b) => a - b);
+  const index = Math.min(sorted.length - 1, Math.max(0, Math.ceil(sorted.length * ratio) - 1));
+  return sorted[index];
+}

package/lib/cli.js CHANGED Viewed

@@ -35,7 +35,7 @@ export async function runCli(argv = []) {
     console.log('\n开始真实测速：GET /api/health + POST /v1/responses stream=true');
     console.log('测速会按入口并行执行，每个入口内部仍按轮次顺序执行，避免同时打出过多真实请求。');
-    console.log('推荐规则：成功率优先，其次按首包、完成、健康检查的综合延迟排序。');
+    console.log('推荐规则：成功率优先，其次按首包、完成、尾延迟和健康检查计算体验分，分数越低越好。');
     console.log(`模型：${model.id}，测速输出上限：${maxOutputTokens}`);
     const results = await benchmarkNodes(INGRESS_NODES, {
       apiKey,
@@ -97,12 +97,14 @@ export function printResults(results) {
     formatMs(item.tlsMs),
     formatMs(item.firstEventMs),
     formatMs(item.totalMs),
+    formatMs(item.tailTotalMs),
     `${Math.round(item.successRate * 100)}%`,
+    formatScore(item.experienceScore),
     formatMs(item.healthMs),
     item === recommended ? '推荐' : '-',
     item.error || '-'
   ]);
-  const header = ['节点', 'DNS', 'TCP', 'TLS', '首包', '完成', '成功率', '健康检查', '推荐', '错误'];
+  const header = ['节点', 'DNS', 'TCP', 'TLS', '首包', '完成', '尾延迟', '成功率', '体验分', '健康检查', '推荐', '错误'];
   const widths = header.map((name, i) => Math.max(displayWidth(name), ...rows.map((row) => displayWidth(row[i]))) + 2);
   console.log('');
   console.log(formatRow(header, widths));
@@ -173,6 +175,10 @@ function displayWidth(value) {
   return Array.from(String(value)).reduce((sum, char) => sum + (char.charCodeAt(0) > 255 ? 2 : 1), 0);
 }
+function formatScore(value) {
+  return Number.isFinite(value) ? String(Math.round(value)) : '-';
+}
 function clamp(value, min, max) {
   if (!Number.isFinite(value)) return max;
   return Math.max(min, Math.min(max, Math.floor(value)));

package/lib/help.js CHANGED Viewed

@@ -1,5 +1,5 @@
 export const PACKAGE_NAME = 'gpteam';
-export const PACKAGE_VERSION = '0.1.4';
+export const PACKAGE_VERSION = '0.1.5';
 export function getHelpText() {
   return [

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "gpteam",
-  "version": "0.1.4",
+  "version": "0.1.5",
   "description": "GPTeam API interactive client configurator and ingress benchmark CLI.",
   "type": "module",
   "bin": {