npm - gpteam - Versions diffs - 0.1.3 → 0.1.5 - Mend

gpteam 0.1.3 → 0.1.5

This diff shows the differences between two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions exactly as they appear in their respective public registries.

Files changed (5)

package/README.md CHANGED Viewed

@@ -8,6 +8,8 @@ npx gpteam
 The CLI asks for an API key, validates it with `/v1/models`, detects available models, benchmarks all production ingress endpoints with real API requests, then backs up old files and writes the selected client configuration. The next steps are blocked until the key validation succeeds. Ingress endpoints are benchmarked in parallel, while rounds for the same endpoint remain sequential to keep real API request pressure bounded. Failed benchmark rows show their error reason in the result table.
+Recommendation order is deterministic: success rate first, then an experience score. The score weighs first SSE event time, total completion time, p90 completion tail latency, and health-check time, so a node with one very slow probe is not recommended just because its median result looks good. Model prompts use "configurable context" wording because the value is written to the client-side Codex `model_context_window`; it must not be confused with a public marketing total-window label.
 Codex config writing follows the same safety pattern as cc-switch: keep top-level fields separate from provider tables, preserve unrelated sections such as MCP servers, and stop before writing if the generated TOML would contain duplicate keys.
 Supported clients:

package/lib/bench.js CHANGED Viewed

@@ -3,6 +3,16 @@ import https from 'node:https';
 import { performance } from 'node:perf_hooks';
 import { inspectSSEBody } from './sse.js';
+const MISSING_LATENCY_MS = 999999;
+const SCORE_WEIGHTS = {
+  firstEvent: 0.55,
+  total: 0.30,
+  health: 0.05,
+  tailFirstEventPenalty: 0.25,
+  tailTotalPenalty: 0.20,
+  failurePenalty: 4
+};
 export async function benchmarkNodes(nodes, options) {
   const rounds = options.rounds || 3;
   const runBenchmark = options.benchmarkNode || benchmarkNode;
@@ -13,7 +23,7 @@ export async function benchmarkNodes(nodes, options) {
     }
     return summarizeNode(node, samples);
   }));
-  return results.sort((a, b) => scoreResult(a) - scoreResult(b));
+  return results.sort(compareResults);
 }
 export async function benchmarkNode(node, options) {
@@ -30,18 +40,24 @@ export async function benchmarkNode(node, options) {
 export function summarizeNode(node, samples) {
   const successful = samples.filter((sample) => sample.ok);
   const streams = successful.map((sample) => sample.stream);
-  return {
+  const firstEvents = streams.map((item) => item.firstEventMs).filter(Number.isFinite);
+  const totals = streams.map((item) => item.totalMs).filter(Number.isFinite);
+  const summary = {
     node,
     samples,
     successRate: samples.length ? successful.length / samples.length : 0,
-    firstEventMs: median(streams.map((item) => item.firstEventMs).filter(Number.isFinite)),
-    totalMs: median(streams.map((item) => item.totalMs).filter(Number.isFinite)),
+    firstEventMs: median(firstEvents),
+    totalMs: median(totals),
+    tailFirstEventMs: percentile(firstEvents, 0.9),
+    tailTotalMs: percentile(totals, 0.9),
     dnsMs: median(streams.map((item) => item.dnsMs).filter(Number.isFinite)),
     tcpMs: median(streams.map((item) => item.tcpMs).filter(Number.isFinite)),
     tlsMs: median(streams.map((item) => item.tlsMs).filter(Number.isFinite)),
     healthMs: median(successful.map((sample) => sample.health.totalMs).filter(Number.isFinite)),
     error: samples.find((sample) => sample.error)?.error || ''
   };
+  summary.experienceScore = scoreResult(summary);
+  return summary;
 }
 export function formatMs(value) {
@@ -50,9 +66,32 @@ export function formatMs(value) {
   return `${(value / 1000).toFixed(2)}s`;
 }
+function compareResults(a, b) {
+  const successDelta = b.successRate - a.successRate;
+  if (successDelta !== 0) return successDelta;
+  const scoreDelta = a.experienceScore - b.experienceScore;
+  if (scoreDelta !== 0) return scoreDelta;
+  return String(a.node.id || a.node.label).localeCompare(String(b.node.id || b.node.label));
+}
 function scoreResult(result) {
-  if (!result.successRate) return Number.MAX_SAFE_INTEGER;
-  return (result.firstEventMs || 999999) + (result.totalMs || 999999) - result.successRate * 1000;
+  if (!result.successRate) return Number.POSITIVE_INFINITY;
+  const firstEventMs = finiteOrFallback(result.firstEventMs);
+  const totalMs = finiteOrFallback(result.totalMs);
+  const healthMs = finiteOrFallback(result.healthMs);
+  const tailFirstEventMs = finiteOrFallback(result.tailFirstEventMs, firstEventMs);
+  const tailTotalMs = finiteOrFallback(result.tailTotalMs, totalMs);
+  const typicalLatency = firstEventMs * SCORE_WEIGHTS.firstEvent
+    + totalMs * SCORE_WEIGHTS.total
+    + healthMs * SCORE_WEIGHTS.health;
+  const tailPenalty = Math.max(0, tailFirstEventMs - firstEventMs) * SCORE_WEIGHTS.tailFirstEventPenalty
+    + Math.max(0, tailTotalMs - totalMs) * SCORE_WEIGHTS.tailTotalPenalty;
+  const failurePenalty = 1 + Math.max(0, 1 - result.successRate) * SCORE_WEIGHTS.failurePenalty;
+  return (typicalLatency + tailPenalty) * failurePenalty;
+}
+function finiteOrFallback(value, fallback = MISSING_LATENCY_MS) {
+  return Number.isFinite(value) ? value : fallback;
 }
 async function measureHealth(url) {
@@ -160,3 +199,10 @@ function median(values) {
   const middle = Math.floor(sorted.length / 2);
   return sorted.length % 2 ? sorted[middle] : (sorted[middle - 1] + sorted[middle]) / 2;
 }
+function percentile(values, ratio) {
+  if (!values.length) return NaN;
+  const sorted = [...values].sort((a, b) => a - b);
+  const index = Math.min(sorted.length - 1, Math.max(0, Math.ceil(sorted.length * ratio) - 1));
+  return sorted[index];
+}

package/lib/cli.js CHANGED Viewed

@@ -35,6 +35,7 @@ export async function runCli(argv = []) {
     console.log('\n开始真实测速：GET /api/health + POST /v1/responses stream=true');
     console.log('测速会按入口并行执行，每个入口内部仍按轮次顺序执行，避免同时打出过多真实请求。');
+    console.log('推荐规则：成功率优先，其次按首包、完成、尾延迟和健康检查计算体验分，分数越低越好。');
     console.log(`模型：${model.id}，测速输出上限：${maxOutputTokens}`);
     const results = await benchmarkNodes(INGRESS_NODES, {
       apiKey,
@@ -96,12 +97,14 @@ export function printResults(results) {
     formatMs(item.tlsMs),
     formatMs(item.firstEventMs),
     formatMs(item.totalMs),
+    formatMs(item.tailTotalMs),
     `${Math.round(item.successRate * 100)}%`,
+    formatScore(item.experienceScore),
     formatMs(item.healthMs),
     item === recommended ? '推荐' : '-',
     item.error || '-'
   ]);
-  const header = ['节点', 'DNS', 'TCP', 'TLS', '首包', '完成', '成功率', '健康检查', '推荐', '错误'];
+  const header = ['节点', 'DNS', 'TCP', 'TLS', '首包', '完成', '尾延迟', '成功率', '体验分', '健康检查', '推荐', '错误'];
   const widths = header.map((name, i) => Math.max(displayWidth(name), ...rows.map((row) => displayWidth(row[i]))) + 2);
   console.log('');
   console.log(formatRow(header, widths));
@@ -123,7 +126,7 @@ async function chooseModel(rl, models, preferred) {
 async function askContextLength(rl, model, preferred) {
   const max = Number(model.contextLength || 400000);
   if (preferred) return clamp(Number(preferred), 1, max);
-  const answer = await rl.question(`请输入上下文窗口（最大 ${max}，输出上限 ${model.maxOutputTokens}，默认 ${max}，回车即选择默认）：`);
+  const answer = await rl.question(`请输入可配置上下文长度（最大 ${max}，输出上限 ${model.maxOutputTokens}，默认 ${max}，回车即选择默认）：`);
   return clamp(Number(answer || max), 1, max);
 }
@@ -172,6 +175,10 @@ function displayWidth(value) {
   return Array.from(String(value)).reduce((sum, char) => sum + (char.charCodeAt(0) > 255 ? 2 : 1), 0);
 }
+function formatScore(value) {
+  return Number.isFinite(value) ? String(Math.round(value)) : '-';
+}
 function clamp(value, min, max) {
   if (!Number.isFinite(value)) return max;
   return Math.max(min, Math.min(max, Math.floor(value)));
@@ -180,7 +187,7 @@ function clamp(value, min, max) {
 export function formatModelLabel(model) {
   const context = Number(model.contextLength || 0);
   const outputTokens = Number(model.maxOutputTokens || 0);
-  return `${model.id}（上下文窗口 ${context}，输出上限 ${outputTokens}）`;
+  return `${model.id}（可配置上下文 ${context}，输出上限 ${outputTokens}）`;
 }
 export function formatNodeLabel(node) {

package/lib/help.js CHANGED Viewed

@@ -1,5 +1,5 @@
 export const PACKAGE_NAME = 'gpteam';
-export const PACKAGE_VERSION = '0.1.3';
+export const PACKAGE_VERSION = '0.1.5';
 export function getHelpText() {
   return [
@@ -13,7 +13,7 @@ export function getHelpText() {
     '  --api-key <key>          预填 API key',
     '  --client <id>            codex / opencode / claude-code / openclaw',
     '  --model <id>             预选模型，例如 gpt-5.5',
-    '  --context <tokens>       预设上下文窗口',
+    '  --context <tokens>       预设可配置上下文长度',
     '  --effort <level>         按模型支持项预选，常见为 none / low / medium / high / xhigh',
     '  --node <id>              jp-direct / jp-split / hk-split / us-split',
     '  --rounds <n>             每个入口测速轮数，默认 3',

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "gpteam",
-  "version": "0.1.3",
+  "version": "0.1.5",
   "description": "GPTeam API interactive client configurator and ingress benchmark CLI.",
   "type": "module",
   "bin": {