npm - @openhoo/hoopilot - Versions diffs - 0.7.3 → 0.7.5 - Mend

@openhoo/hoopilot 0.7.3 → 0.7.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (10)

package/README.md CHANGED

@@ -158,7 +158,7 @@ Incoming `x-request-id` headers are preserved on responses. If a request has no
 Hoopilot tracks token usage, request counts, and latency in memory while the server runs, and can report your GitHub Copilot account quota (premium-request "credit" usage).
-- `GET /metrics` returns Prometheus text (`text/plain; version=0.0.4`). It exposes request counters (`hoopilot_requests_total`), upstream call counters (`hoopilot_upstream_requests_total`), token counters by model and type (`hoopilot_tokens_total{model,type}`), a request-duration histogram (`hoopilot_request_duration_seconds`), an in-flight gauge, and—once `/v1/usage` has been fetched at least once—Copilot quota gauges (`hoopilot_copilot_quota_remaining{category}`, `_entitlement`, `_used`, `_percent_remaining`). Counters reset to zero on restart, which Prometheus handles natively.
+- `GET /metrics` returns Prometheus text (`text/plain; version=0.0.4`). It exposes request counters (`hoopilot_requests_total`), upstream call counters (`hoopilot_upstream_requests_total`), token counters by model and type (`hoopilot_tokens_total{model,type}`), a request-duration histogram (`hoopilot_request_duration_seconds`), an in-flight gauge, and—once `/v1/usage` has been fetched at least once—Copilot quota gauges (`hoopilot_copilot_quota_remaining{category}`, `_entitlement`, `_used`, `_percent_remaining`, `_overage_count`, `_overage_entitlement`, `_unlimited`, `_overage_permitted`, `_has_quota`, `_token_based_billing`, and category reset/snapshot timestamps). Counters reset to zero on restart, which Prometheus handles natively.
 - `GET /v1/usage` returns JSON combining the proxy metrics snapshot with live Copilot quota fetched from GitHub (cached for 60 seconds). If the quota cannot be read, `copilot` is `null` and `copilot_error` explains why, but the proxy metrics are still returned.
 - `hoopilot usage` prints your Copilot plan and quota from the command line.

package/dist/cli.js CHANGED

@@ -293,22 +293,31 @@ function normalizeCopilotUsage(body) {
 }
 function normalizeQuotaDetail(detail) {
   const entitlement = numberOrUndefined(detail.entitlement);
+  const overageCount = numberOrUndefined(detail.overage_count);
   const remaining = numberOrUndefined(detail.remaining) ?? numberOrUndefined(detail.quota_remaining);
   return removeUndefinedQuota({
     entitlement,
-    overageCount: numberOrUndefined(detail.overage_count),
+    hasQuota: typeof detail.has_quota === "boolean" ? detail.has_quota : void 0,
+    overageCount,
+    overageEntitlement: numberOrUndefined(detail.overage_entitlement),
     overagePermitted: typeof detail.overage_permitted === "boolean" ? detail.overage_permitted : void 0,
     percentRemaining: numberOrUndefined(detail.percent_remaining),
+    quotaId: stringOrUndefined(detail.quota_id),
+    quotaResetAt: stringOrUndefined(detail.quota_reset_at),
     remaining,
+    timestampUtc: stringOrUndefined(detail.timestamp_utc),
+    tokenBasedBilling: typeof detail.token_based_billing === "boolean" ? detail.token_based_billing : void 0,
     unlimited: typeof detail.unlimited === "boolean" ? detail.unlimited : void 0,
-    used: usedFrom(entitlement, remaining)
+    used: usedFrom(entitlement, remaining, overageCount)
   });
 }
-function usedFrom(entitlement, remaining) {
+function usedFrom(entitlement, remaining, overageCount) {
   if (entitlement === void 0 || remaining === void 0) {
     return void 0;
   }
-  return Math.max(0, entitlement - remaining);
+  const base = entitlement - remaining;
+  const overage = remaining === 0 ? overageCount ?? 0 : 0;
+  return Math.max(0, base + overage);
 }
 function numberOrUndefined(value) {
   return typeof value === "number" && Number.isFinite(value) ? value : void 0;
@@ -571,6 +580,12 @@ function isLogLevel(value) {
 // src/openai.ts
 var DEFAULT_MODEL = "gpt-4.1";
+var OpenAICompatibilityError = class extends Error {
+  constructor(message) {
+    super(message);
+    this.name = "OpenAICompatibilityError";
+  }
+};
 function normalizeChatCompletionRequest(request) {
   return removeUndefined({
     ...request,
@@ -578,13 +593,22 @@ function normalizeChatCompletionRequest(request) {
   });
 }
 function completionsRequestToChatCompletion(request) {
+  assertSupportedLegacyCompletionRequest(request);
   return removeUndefined({
+    frequency_penalty: request.frequency_penalty,
+    logit_bias: request.logit_bias,
     max_tokens: request.max_tokens,
-    messages: [{ content: promptToText(request.prompt), role: "user" }],
+    messages: [{ content: legacyPromptToText(request.prompt), role: "user" }],
     model: normalizeRequestedModel(request.model),
+    n: request.n,
+    presence_penalty: request.presence_penalty,
+    seed: request.seed,
+    stop: request.stop,
     stream: request.stream === true,
+    stream_options: request.stream_options,
     temperature: request.temperature,
-    top_p: request.top_p
+    top_p: request.top_p,
+    user: request.user
   });
 }
 function normalizeRequestedModel(model) {
@@ -592,21 +616,21 @@ function normalizeRequestedModel(model) {
   return requested || DEFAULT_MODEL;
 }
 function chatCompletionToCompletion(completion) {
-  const choice = firstChoice(completion);
-  const message = asRecord(choice.message);
   return removeUndefined({
-    choices: [
-      {
+    choices: completionChoices(completion).map((choice, index) => {
+      const message = asRecord(choice.message);
+      return {
         finish_reason: choice.finish_reason ?? "stop",
-        index: 0,
-        logprobs: null,
-        text: contentToText(message.content)
-      }
-    ],
+        index: typeof choice.index === "number" ? choice.index : index,
+        logprobs: choice.logprobs ?? null,
+        text: contentToText(choice.text) || contentToText(message.content)
+      };
+    }),
     created: completion.created ?? epochSeconds(),
     id: completion.id ?? `cmpl_${randomId()}`,
     model: completion.model ?? DEFAULT_MODEL,
     object: "text_completion",
+    system_fingerprint: completion.system_fingerprint,
     usage: completion.usage
   });
 }
@@ -679,11 +703,38 @@ function fallbackModels() {
     }
   ];
 }
-function promptToText(prompt) {
-  if (Array.isArray(prompt)) {
-    return prompt.map((item) => contentToText(item)).join("\n");
+function legacyPromptToText(prompt) {
+  if (typeof prompt === "string") {
+    return prompt;
+  }
+  if (Array.isArray(prompt) && prompt.length === 1 && typeof prompt[0] === "string") {
+    return prompt[0];
+  }
+  throw new OpenAICompatibilityError(
+    "Hoopilot legacy completions compatibility supports exactly one string prompt per request."
+  );
+}
+function assertSupportedLegacyCompletionRequest(request) {
+  if (request.echo === true) {
+    throw new OpenAICompatibilityError(
+      "Hoopilot legacy completions compatibility does not support echo=true."
+    );
+  }
+  if (typeof request.best_of === "number" && request.best_of > 1) {
+    throw new OpenAICompatibilityError(
+      "Hoopilot legacy completions compatibility does not support best_of greater than 1."
+    );
+  }
+  if (typeof request.logprobs === "number" && request.logprobs > 0) {
+    throw new OpenAICompatibilityError(
+      "Hoopilot legacy completions compatibility does not support legacy logprobs."
+    );
+  }
+  if (contentToText(request.suffix)) {
+    throw new OpenAICompatibilityError(
+      "Hoopilot legacy completions compatibility does not support suffix."
+    );
   }
-  return contentToText(prompt);
 }
 function contentToText(content) {
   if (typeof content === "string") {
@@ -741,9 +792,9 @@ function firstNumber(...values) {
   }
   return void 0;
 }
-function firstChoice(completion) {
+function completionChoices(completion) {
   const choices = Array.isArray(completion.choices) ? completion.choices : [];
-  return asRecord(choices[0]);
+  return choices.map((choice) => asRecord(choice));
 }
 function processCompletionSseBlock(block, enqueue, markTerminal) {
   let event = "message";
@@ -775,25 +826,28 @@ function processCompletionSseBlock(block, enqueue, markTerminal) {
     enqueue({ error });
     return;
   }
-  const choice = firstChoice(parsed);
-  const delta = asRecord(choice.delta);
-  const text = contentToText(delta.content);
-  const finishReason = choice.finish_reason ?? null;
+  const choices = completionChoices(parsed).map((choice, index) => {
+    const delta = asRecord(choice.delta);
+    const text = contentToText(delta.content);
+    const finishReason = choice.finish_reason ?? null;
+    if (!text && finishReason === null) {
+      return void 0;
+    }
+    return {
+      finish_reason: finishReason,
+      index: typeof choice.index === "number" ? choice.index : index,
+      logprobs: choice.logprobs ?? null,
+      text
+    };
+  }).filter((choice) => choice !== void 0);
   const usage = asRecord(parsed.usage);
   const hasUsage = Object.keys(usage).length > 0;
-  if (!text && finishReason === null && !hasUsage) {
+  if (choices.length === 0 && !hasUsage) {
     return;
   }
   enqueue(
     removeUndefined({
-      choices: text || finishReason !== null ? [
-        {
-          finish_reason: finishReason,
-          index: typeof choice.index === "number" ? choice.index : 0,
-          logprobs: null,
-          text
-        }
-      ] : [],
+      choices,
       created: typeof parsed.created === "number" ? parsed.created : epochSeconds(),
       id: contentToText(parsed.id) || `cmpl_${randomId()}`,
       model: contentToText(parsed.model) || DEFAULT_MODEL,
@@ -1049,11 +1103,43 @@ var MetricsRegistry = class {
     gauge("remaining", "Remaining quota for the Copilot category.", (q) => q.remaining);
     gauge("entitlement", "Quota entitlement for the Copilot category.", (q) => q.entitlement);
     gauge("used", "Used quota (entitlement minus remaining) for the category.", (q) => q.used);
+    gauge("overage_count", "Overage count for the Copilot category.", (q) => q.overageCount);
+    gauge(
+      "overage_entitlement",
+      "Overage entitlement for the Copilot category.",
+      (q) => q.overageEntitlement
+    );
     gauge(
       "percent_remaining",
       "Percent of quota remaining for the Copilot category.",
       (q) => q.percentRemaining
     );
+    booleanGauge(
+      "unlimited",
+      "Whether the Copilot quota category is unlimited.",
+      (q) => q.unlimited
+    );
+    booleanGauge(
+      "overage_permitted",
+      "Whether overage is permitted for the Copilot category.",
+      (q) => q.overagePermitted
+    );
+    booleanGauge("has_quota", "Whether the Copilot quota category has a quota.", (q) => q.hasQuota);
+    booleanGauge(
+      "token_based_billing",
+      "Whether the Copilot quota category uses token-based billing.",
+      (q) => q.tokenBasedBilling
+    );
+    dateGauge(
+      "category_reset_timestamp_seconds",
+      "Unix epoch of the Copilot category-specific quota reset.",
+      (q) => q.quotaResetAt
+    );
+    dateGauge(
+      "category_snapshot_timestamp_seconds",
+      "Unix epoch of the Copilot category quota snapshot.",
+      (q) => q.timestampUtc
+    );
     const resetMs = usage.quotaResetDate ? Date.parse(usage.quotaResetDate) : Number.NaN;
     if (Number.isFinite(resetMs)) {
       lines.push(
@@ -1072,6 +1158,30 @@ var MetricsRegistry = class {
         })} 1`
       );
     }
+    function booleanGauge(suffix, help, pick) {
+      const present = categories.filter(([, quota]) => pick(quota) !== void 0);
+      if (present.length === 0) {
+        return;
+      }
+      lines.push(`# HELP hoopilot_copilot_quota_${suffix} ${help}`);
+      lines.push(`# TYPE hoopilot_copilot_quota_${suffix} gauge`);
+      for (const [category, quota] of present) {
+        lines.push(
+          `hoopilot_copilot_quota_${suffix}${labels({ category })} ${pick(quota) ? 1 : 0}`
+        );
+      }
+    }
+    function dateGauge(suffix, help, pick) {
+      const present = categories.map(([category, quota]) => [category, Date.parse(pick(quota) ?? "")]).filter(([, timestamp]) => Number.isFinite(timestamp));
+      if (present.length === 0) {
+        return;
+      }
+      lines.push(`# HELP hoopilot_copilot_quota_${suffix} ${help}`);
+      lines.push(`# TYPE hoopilot_copilot_quota_${suffix} gauge`);
+      for (const [category, timestamp] of present) {
+        lines.push(`hoopilot_copilot_quota_${suffix}${labels({ category })} ${timestamp / 1e3}`);
+      }
+    }
   }
 };
 function observeResponseUsage(response, fallbackModel, onUsage, signal) {
@@ -1312,6 +1422,12 @@ function createHoopilotHandler(options = {}) {
           "request body was invalid json"
         );
         return finish(jsonError(400, "invalid_request_error", message));
+      } else if (error instanceof OpenAICompatibilityError) {
+        requestLogger.warn(
+          { err: errorDetails(error), event: "http.request.failed" },
+          "request body used unsupported OpenAI compatibility fields"
+        );
+        return finish(jsonError(400, "invalid_request_error", message));
       } else if (error instanceof RequestBodyTooLargeError) {
         requestLogger.warn(
           { err: errorDetails(error), event: "http.request.failed" },
@@ -1763,8 +1879,8 @@ function metricsResponse(metrics) {
   });
 }
 async function handleUsage(metrics, readUsage, signal) {
-  const proxy = metrics.snapshot();
   const { copilot, error } = await readUsage(signal);
+  const proxy = metrics.snapshot();
   const body = { copilot: copilot ?? null, object: "usage", proxy };
   if (error) {
     body.copilot_error = error;
@@ -1789,10 +1905,10 @@ function createUsageReader(client, metrics, now = Date.now, ttlMs = USAGE_CACHE_
       metrics.recordCopilotQuota(value);
       return { copilot: value };
     } catch (error) {
-      metrics.recordUpstream(usagePath, false);
       if (error instanceof CopilotAuthError) {
         return { error: error.message };
       }
+      metrics.recordUpstream(usagePath, false);
       return { error: errorMessage(error) };
     }
   };