npm - copilot-reverse - Versions diffs - 0.5.5 → 0.7.0 - Mend

copilot-reverse 0.5.5 → 0.7.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (12)

package/dist/changes.js +52 -0
package/dist/cli/index.js +4 -3
package/dist/supervisor/db.js +10 -6
package/dist/supervisor/index.js +1 -1
package/dist/tui/app.js +4 -0
package/dist/tui/assistant/tools.js +1 -1
package/dist/tui/panels/metrics-agg.js +30 -4
package/dist/tui/slash/commands.js +20 -2
package/dist/version.js +1 -1
package/dist/worker/anthropic-server.js +4 -4
package/dist/worker/openai-server.js +15 -10
package/package.json +2 -2

package/dist/changes.js ADDED Viewed

@@ -0,0 +1,52 @@
+export const APP_CHANGES = [
+    {
+        "version": "0.6.0",
+        "date": "2026-06-29",
+        "summary": "feat(tui): add a `/changes` command listing the 10 most recent releases (version, date, summary) with a link to the full CHANGELOG, and refocus the startup \"what's new\" banner on important messages — it now points to `/changes` instead of advertising a bug fix, and still self-suppresses after 3 launches."
+    },
+    {
+        "version": "0.5.5",
+        "date": "2026-06-29",
+        "summary": "ci: gate PRs on a changeset. A pull request with no file in `.changes/` now fails the `changeset` check, so merges can't silently skip the release (the v0.5.3 freeze). Docs/test-only PRs opt out with a `no-changeset` label."
+    },
+    {
+        "version": "0.5.4",
+        "date": "2026-06-29",
+        "summary": "fix(worker): stop the empty-tool-call loop (\"call: call: call:…\") that froze sessions. Inline-XML blocks that recover no tool are now passed through verbatim instead of silently swallowed; nameless `function_call` items on the /responses path are dropped instead of streamed as a blank `call:`; and the runaway deadline now covers tool-call streams, not just text — a model looping on tool calls is cut cleanly instead of relaying forever."
+    },
+    {
+        "version": "0.5.3",
+        "date": "2026-06-29",
+        "summary": "Fix inline tool-call XML (`<invoke name=…>`) leaking as literal text instead of running. The extractor that recovers these blocks only ran on the chat path when the request declared tools, and never on the Codex `/responses` path. It now runs always-on across both streaming and non-stream paths, so a follow-up turn or a `/responses` model can no longer dump raw XML into the reply."
+    },
+    {
+        "version": "0.5.2",
+        "date": "2026-06-29",
+        "summary": "Fix the daemon going permanently dead during dogfooding. The worker had no `unhandledRejection` handler, so a stray floating rejection silently killed it (exit 1, empty stderr) on Node ≥15; once that happened 5×/60s the supervisor marked it `unhealthy` and gave up forever, leaving a running daemon with a dead worker. The worker now handles `unhandledRejection`, writes the cause to stderr *before* the IPC report (so crashes are no longer blind), the supervisor persists each crash to `crash.log`, and `unhealthy` now recovers: after a 30s cooldown it resets the window and tries again instead of staying down."
+    },
+    {
+        "version": "0.5.1",
+        "date": "2026-06-28",
+        "summary": "Fix the app dropping back to the shell during concurrent use. The TUI and supervisor share one process, but several synchronous throw sites had no handler — most importantly an SSE write to a client socket that died between broadcasts (likely with multiple clients connected), which crashed the whole process. Each broadcast listener is now isolated and a dead SSE connection is dropped instead of retried; `readGhToken` returns null on a corrupt/locked read instead of throwing on the heartbeat tick; and a process-level backstop logs any remaining stray throw/rejection to `~/.copilot-reverse/crash.log` and keeps the TUI alive."
+    },
+    {
+        "version": "0.5.0",
+        "date": "2026-06-28",
+        "summary": "Add a GitHub-token heartbeat: the supervisor now re-checks every ~60s whether the stored GitHub login still works, and the TUI footer shows a live `github ✓` / `✗ /login` badge — so an expired or revoked login surfaces within ~60s instead of only on the next failed request or a manual `/status`. A transient network/rate-limit hiccup is distinguished from a real auth failure, so the badge never flips on a single blip."
+    },
+    {
+        "version": "0.4.0",
+        "date": "2026-06-26",
+        "summary": "Codex `/responses` support, web search via Microsoft Web IQ, and a tool-call recovery fix:"
+    },
+    {
+        "version": "0.3.0",
+        "date": "2026-06-26",
+        "summary": "Restore `web_search` and `web_fetch` for Claude Code through the gateway: the worker now runs these tools internally against Microsoft Web IQ in a transparent agentic loop, and a new `/web-search-support` command stores the WebIQ API key."
+    },
+    {
+        "version": "0.2.1",
+        "date": "2026-06-25",
+        "summary": "Fix `/login` hanging with no output: the device-code prompt is now shown immediately while authorization is pending, instead of being buffered behind the blocking token poll."
+    }
+];

package/dist/cli/index.js CHANGED Viewed

@@ -181,11 +181,12 @@ async function launchTui() {
         }
     });
     const persistedModel = readChatModel(dataDir());
-    // "What's new" banner: MAJOR changes only — keyed by version so each release re-announces, shown
-    // ~3 launches then quiet. Minor fixes/polish do NOT go here; reserve it for things worth noticing.
+    // "What's new" banner: IMPORTANT messages only (new capabilities, things worth noticing) — NOT
+    // bug fixes. Keyed by version so each release re-announces, shown ~3 launches then quiet. The full
+    // list lives behind /changes; this is just a nudge.
     const CHANGE_ID = `v${APP_VERSION}`;
     const changeBanner = shouldShowChange(dataDir(), CHANGE_ID)
-        ? { lines: ["• runaway streams now cut cleanly — no more frozen 'code code code' sessions"] }
+        ? { lines: ["• type /changes to see what's new across recent releases"] }
         : undefined;
     // Startup overview. The token was already validated above (re-auth happens before we get here), so
     // GitHub is connected; web search readiness and configured clients are read from disk.

package/dist/supervisor/db.js CHANGED Viewed

@@ -9,12 +9,16 @@ export function openDb(file) {
       exit_code INTEGER, stderr_tail TEXT NOT NULL, backoff_ms INTEGER NOT NULL, marked_unhealthy INTEGER NOT NULL DEFAULT 0);
     CREATE TABLE IF NOT EXISTS request_log (
       id INTEGER PRIMARY KEY AUTOINCREMENT, ts INTEGER NOT NULL, endpoint TEXT NOT NULL,
-      model TEXT NOT NULL, status INTEGER NOT NULL, latency_ms INTEGER NOT NULL, error TEXT);
+      model TEXT NOT NULL, status INTEGER NOT NULL, latency_ms INTEGER NOT NULL, tokens_in INTEGER, tokens_out INTEGER, error TEXT);
   `);
-    // Migrate request_log tables created before the error column existed.
+    // Migrate request_log tables created before later columns existed.
     const cols = db.prepare(`PRAGMA table_info(request_log)`).all();
     if (!cols.some((c) => c.name === "error"))
         db.exec(`ALTER TABLE request_log ADD COLUMN error TEXT`);
+    if (!cols.some((c) => c.name === "tokens_in"))
+        db.exec(`ALTER TABLE request_log ADD COLUMN tokens_in INTEGER`);
+    if (!cols.some((c) => c.name === "tokens_out"))
+        db.exec(`ALTER TABLE request_log ADD COLUMN tokens_out INTEGER`);
     return db;
 }
 export function recordRestart(db, e) {
@@ -26,10 +30,10 @@ export function listRestarts(db, limit) {
     FROM restart_events ORDER BY ts DESC LIMIT ?`).all(limit);
 }
 export function recordRequest(db, m) {
-    db.prepare(`INSERT INTO request_log (ts, endpoint, model, status, latency_ms, error) VALUES (@ts, @endpoint, @model, @status, @latencyMs, @error)`)
-        .run({ error: null, ...m });
+    db.prepare(`INSERT INTO request_log (ts, endpoint, model, status, latency_ms, tokens_in, tokens_out, error) VALUES (@ts, @endpoint, @model, @status, @latencyMs, @tokensIn, @tokensOut, @error)`)
+        .run({ tokensIn: null, tokensOut: null, error: null, ...m });
 }
 export function recentRequests(db, limit) {
-    return db.prepare(`SELECT ts, endpoint, model, status, latency_ms as latencyMs, error FROM request_log ORDER BY ts DESC LIMIT ?`).all(limit)
-        .map(({ error, ...r }) => (error == null ? r : { ...r, error }));
+    return db.prepare(`SELECT ts, endpoint, model, status, latency_ms as latencyMs, tokens_in as tokensIn, tokens_out as tokensOut, error FROM request_log ORDER BY ts DESC LIMIT ?`).all(limit)
+        .map(({ tokensIn, tokensOut, error, ...r }) => ({ ...r, ...(tokensIn != null ? { tokensIn } : {}), ...(tokensOut != null ? { tokensOut } : {}), ...(error != null ? { error } : {}) }));
 }

package/dist/supervisor/index.js CHANGED Viewed

@@ -29,7 +29,7 @@ export function startSupervisor() {
         },
         onWorkerMessage: (m) => {
             if (m.type === "request-metric") {
-                const sample = { ts: Date.now(), endpoint: m.endpoint, model: m.model, status: m.status, latencyMs: m.latencyMs, error: m.error };
+                const sample = { ts: Date.now(), endpoint: m.endpoint, model: m.model, status: m.status, latencyMs: m.latencyMs, tokensIn: m.tokensIn, tokensOut: m.tokensOut, error: m.error };
                 recordRequest(db, sample);
                 bus.emit("metric", sample);
             }

package/dist/tui/app.js CHANGED Viewed

@@ -267,6 +267,10 @@ export function App({ registry, title, workerState = "starting", initialModel =
                         const tokens = Math.ceil(e.text.length / 4);
                         return (_jsxs(Box, { flexDirection: "column", children: [_jsxs(Text, { color: theme.accent, children: ["\u273D ", _jsxs(Text, { color: theme.muted, children: [frame, " ", loadingVerb(elapsed), "\u2026 (esc to interrupt \u00B7 ", fmtElapsed(elapsed), " \u00B7 \u2193 ", fmtTokens(tokens), " tokens \u00B7 thinking)"] })] }), e.text ? _jsx(Text, { color: color, children: e.text }) : null] }, i));
                     }
+                    // User turns get a clay-on-dark highlight bar so they stand out from muted system notes and
+                    // gray assistant output — a clear visual anchor for "this is what I said".
+                    if (e.type === "user")
+                        return _jsx(Box, { marginTop: 1, children: _jsx(Text, { backgroundColor: theme.accent, color: "black", bold: true, children: ` ${e.text.replace(/^›\s*/, "")} ` }) }, i);
                     return _jsx(Text, { color: color, children: e.text }, i);
                 }) }), body, _jsxs(Box, { flexDirection: "column", paddingX: 1, children: [_jsxs(Box, { children: [github && _jsxs(_Fragment, { children: [_jsx(Text, { color: theme.muted, children: "github " }), _jsx(Text, { color: github === "connected" ? theme.ready : theme.error, children: github === "connected" ? "✓" : "✗ /login" })] }), _jsxs(Text, { color: theme.muted, children: [github ? "  ·  " : "", "daemon "] }), _jsx(Text, { color: stateColor[state], children: state })] }), _jsxs(Box, { children: [_jsx(Text, { color: theme.muted, children: "web " }), _jsx(Text, { color: webBackend === "unavailable" ? theme.muted : theme.ready, children: webBackend === "webiq" ? "✓ webiq" : webBackend === "copilot" ? "✓ copilot" : "✗ /webiq" }), _jsx(Text, { color: theme.muted, children: "  \u00B7  " }), _jsx(ClientBadge, { name: "claude", status: status.claude }), _jsx(Text, { color: theme.muted, children: "  " }), _jsx(ClientBadge, { name: "codex", status: status.codex }), _jsx(Text, { color: theme.muted, children: "  \u00B7  /help" })] })] })] }));
 }

package/dist/tui/assistant/tools.js CHANGED Viewed

@@ -31,7 +31,7 @@ export function buildActions(client) {
             const a = aggregate(await client.requests());
             if (!a.total)
                 return "no requests yet";
-            return `requests: ${a.total}, errors: ${a.errors}; ` + a.byModel.map((r) => `${r.model} n=${r.count} avg=${r.avgMs}ms`).join("; ");
+            return `requests: ${a.total}, errors: ${a.errors}, tokens: ${a.tokensIn}↑/${a.tokensOut}↓, est. cost: $${a.costUsd.toFixed(3)}; ` + a.byModel.map((r) => `${r.model} n=${r.count} avg=${r.avgMs}ms`).join("; ");
         },
     };
 }

package/dist/tui/panels/metrics-agg.js CHANGED Viewed

@@ -1,21 +1,47 @@
 // A request "failed" if it returned a 4xx/5xx OR carried an error message — runaway streams finish
 // 200 but tag an error (model degenerated, cut early), and those are exactly what we want to surface.
 const isError = (s) => s.status >= 400 || s.error != null;
+// Indicative $/1M-token list prices (in, out) used ONLY to estimate spend — Copilot is flat-fee, so
+// this is "what these tokens would cost at provider list price", not a real bill. Matched by substring;
+// unknown models fall back to a mid GPT-4o-class rate. Update as needed; precision isn't the point.
+const PRICING = [
+    { match: "opus", in: 15, out: 75 },
+    { match: "sonnet", in: 3, out: 15 },
+    { match: "haiku", in: 0.8, out: 4 },
+    { match: "gpt-5", in: 1.25, out: 10 },
+    { match: "gpt-4o-mini", in: 0.15, out: 0.6 },
+    { match: "gpt-4o", in: 2.5, out: 10 },
+    { match: "o1", in: 15, out: 60 },
+];
+const RATE_FALLBACK = { in: 2.5, out: 10 };
+const rate = (model) => PRICING.find((p) => model.toLowerCase().includes(p.match)) ?? RATE_FALLBACK;
+export function estimateCost(model, tokensIn, tokensOut) {
+    const r = rate(model);
+    return (tokensIn * r.in + tokensOut * r.out) / 1_000_000;
+}
 export function aggregate(samples) {
     const map = new Map();
     let errors = 0;
     for (const s of samples) {
         if (isError(s))
             errors++;
-        const m = map.get(s.model) ?? { count: 0, sum: 0 };
+        const m = map.get(s.model) ?? { count: 0, sum: 0, tin: 0, tout: 0 };
         m.count++;
         m.sum += s.latencyMs;
+        m.tin += s.tokensIn ?? 0;
+        m.tout += s.tokensOut ?? 0;
         map.set(s.model, m);
     }
+    const byModel = [...map.entries()].map(([model, v]) => ({
+        model, count: v.count, avgMs: Math.round(v.sum / v.count),
+        tokensIn: v.tin, tokensOut: v.tout, costUsd: estimateCost(model, v.tin, v.tout),
+    }));
     return {
-        total: samples.length,
-        errors,
-        byModel: [...map.entries()].map(([model, v]) => ({ model, count: v.count, avgMs: Math.round(v.sum / v.count) })),
+        total: samples.length, errors,
+        tokensIn: byModel.reduce((n, r) => n + r.tokensIn, 0),
+        tokensOut: byModel.reduce((n, r) => n + r.tokensOut, 0),
+        costUsd: byModel.reduce((n, r) => n + r.costUsd, 0),
+        byModel,
     };
 }
 // The failed requests (status >= 400 or any tagged error), newest-first, capped at `limit`. This is

package/dist/tui/slash/commands.js CHANGED Viewed

@@ -3,6 +3,7 @@ import { claudeCodeConfig, codexConfig } from "../setup/clients.js";
 import { aggregate, recentErrors } from "../panels/metrics-agg.js";
 import { openUrl as defaultOpenUrl } from "../../shared/open-url.js";
 import { buildIssueUrl, PLACEHOLDER_REPO } from "../report.js";
+import { APP_CHANGES } from "../../changes.js";
 export function buildRegistry(ctx, endpoint, opts = {}) {
     const reg = new Registry(ctx);
     const openUrl = opts.openUrl ?? defaultOpenUrl;
@@ -23,12 +24,18 @@ export function buildRegistry(ctx, endpoint, opts = {}) {
                 return ["no request errors logged — everything's green ✓"];
             return errs.map((e) => `${new Date(e.ts).toISOString()} ${e.status} ${e.endpoint} ${e.model} — ${e.error ?? "(no message)"}`);
         } });
-    reg.add({ name: "/metrics", describe: "request metrics + recent errors", run: async (_a, c) => {
+    reg.add({ name: "/metrics", describe: "request metrics, tokens, cost + recent errors", run: async (_a, c) => {
             const reqs = await c.client.requests();
             const a = aggregate(reqs);
             if (!a.total)
                 return ["no requests yet"];
-            const lines = [`requests: ${a.total}  errors: ${a.errors}`, ...a.byModel.map((r) => `  ${r.model.padEnd(20)} n=${r.count} avg=${r.avgMs}ms`)];
+            const k = (n) => (n >= 1000 ? `${(n / 1000).toFixed(1)}k` : `${n}`);
+            const usd = (n) => `$${n < 1 ? n.toFixed(3) : n.toFixed(2)}`;
+            const lines = [
+                `requests: ${a.total}  errors: ${a.errors}  tokens: ${k(a.tokensIn)}↑ ${k(a.tokensOut)}↓  est. cost: ${usd(a.costUsd)}`,
+                ...a.byModel.map((r) => `  ${r.model.padEnd(20)} n=${r.count} avg=${r.avgMs}ms  ${k(r.tokensIn)}↑ ${k(r.tokensOut)}↓ ~${usd(r.costUsd)}`),
+                "  cost is a list-price estimate (Copilot is flat-fee)",
+            ];
             const errs = recentErrors(reqs, 5);
             if (errs.length) {
                 lines.push("recent errors:");
@@ -68,6 +75,17 @@ export function buildRegistry(ctx, endpoint, opts = {}) {
             openUrl(url);
             return [`opening a pre-filled GitHub issue for ${repo} in your browser…`];
         } });
+    reg.add({ name: "/changes", describe: "what's new — recent releases", run: async () => {
+            if (!APP_CHANGES.length)
+                return ["no changelog bundled"];
+            const lines = APP_CHANGES.slice(0, 10).map((c) => {
+                const s = c.summary.length > 90 ? c.summary.slice(0, 87) + "…" : c.summary;
+                return `v${c.version} (${c.date}) — ${s}`;
+            });
+            const repo = opts.reportRepo && opts.reportRepo !== PLACEHOLDER_REPO ? opts.reportRepo : "wangcansunking/copilot-reverse";
+            lines.push("", `full changelog: https://github.com/${repo}/blob/master/CHANGELOG.md`);
+            return lines;
+        } });
     reg.add({ name: "/quit", describe: "exit copilot-reverse", run: async (_a, c) => { c.quit(); return ["bye"]; } });
     reg.add({ name: "/help", describe: "list commands", run: async () => reg.list().map((c) => `${c.name.padEnd(14)} ${c.describe}`) });
     return reg;

package/dist/version.js CHANGED Viewed

@@ -1,2 +1,2 @@
 // AUTO-GENERATED by scripts/gen-version.mjs from package.json — do not edit.
-export const APP_VERSION = "0.5.5";
+export const APP_VERSION = "0.7.0";

package/dist/worker/anthropic-server.js CHANGED Viewed

@@ -35,7 +35,7 @@ export function mountAnthropic(app, router, onMetric, runner) {
         const canon = anthropicRequestToCanonical(req.body);
         canon.model = router.resolveModel(canon.model);
         const provider = router.pick(canon.model);
-        const metric = (status, error) => onMetric({ endpoint: "/anthropic/v1/messages", model: canon.model, status, latencyMs: Date.now() - start, error });
+        const metric = (status, opts = {}) => onMetric({ endpoint: "/anthropic/v1/messages", model: canon.model, status, latencyMs: Date.now() - start, tokensIn: opts.tokensIn, tokensOut: opts.tokensOut, error: opts.error });
         try {
             if (canon.stream) {
                 res.setHeader("content-type", "text/event-stream");
@@ -157,7 +157,7 @@ export function mountAnthropic(app, router, onMetric, runner) {
                 res.write(frame("message_delta", { type: "message_delta", delta: { stop_reason: finalStop === "tool_use" ? "tool_use" : finalStop === "length" ? "max_tokens" : "end_turn" }, usage: deltaUsage }));
                 res.write(frame("message_stop", { type: "message_stop" }));
                 res.end();
-                metric(200, runaway ? `runaway stream cut (${runawayReason}) — model degenerated, ended early as max_tokens` : undefined);
+                metric(200, { tokensIn: inputTokens, tokensOut: sumCompletion, error: runaway ? `runaway stream cut (${runawayReason}) — model degenerated, ended early as max_tokens` : undefined });
             }
             else {
                 // Non-stream: same gateway loop without SSE — run gateway tools and re-complete until the
@@ -182,7 +182,7 @@ export function mountAnthropic(app, router, onMetric, runner) {
                 if (runner)
                     resp = { ...resp, content: resp.content.filter((b) => b.type !== "tool_use" || !isGatewayTool(b.name)) };
                 res.json(canonicalToAnthropicResponse(resp));
-                metric(200);
+                metric(200, { tokensIn: resp.usage?.promptTokens, tokensOut: resp.usage?.completionTokens });
             }
         }
         catch (err) {
@@ -201,7 +201,7 @@ export function mountAnthropic(app, router, onMetric, runner) {
                 res.write(frame("error", { type: "error", error: { type: errorType, message } }));
                 res.end();
             }
-            metric(status, message);
+            metric(status, { error: message });
         }
     });
 }

package/dist/worker/openai-server.js CHANGED Viewed

@@ -18,7 +18,7 @@ export function mountOpenAI(app, router, onMetric) {
         const canon = openaiRequestToCanonical(req.body);
         canon.model = router.resolveModel(canon.model);
         const provider = router.pick(canon.model);
-        const metric = (status, error) => onMetric({ endpoint: "/openai/chat/completions", model: canon.model, status, latencyMs: Date.now() - start, error });
+        const metric = (status, opts = {}) => onMetric({ endpoint: "/openai/chat/completions", model: canon.model, status, latencyMs: Date.now() - start, tokensIn: opts.tokensIn, tokensOut: opts.tokensOut, error: opts.error });
         try {
             if (canon.stream) {
                 res.setHeader("content-type", "text/event-stream");
@@ -27,8 +27,11 @@ export function mountOpenAI(app, router, onMetric) {
                 const guard = new RunawayGuard();
                 const deadline = start + STREAM_DEADLINE_MS;
                 let runawayReason = "";
+                let usage;
                 for await (const chunk of provider.stream(canon)) {
                     res.write(canonicalChunkToOpenAISSE(chunk, id, canon.model));
+                    if (chunk.done)
+                        usage = chunk.usage;
                     // Backstop covers tool-call streams too: a model can loop on tool calls forever, which
                     // never feeds the text guard — the wall clock cuts those cleanly instead of freezing.
                     if (chunk.kind === "text" && guard.push(chunk.delta)) {
@@ -41,11 +44,12 @@ export function mountOpenAI(app, router, onMetric) {
                     }
                 }
                 res.end();
-                metric(200, runawayReason ? `runaway stream cut (${runawayReason}) — model degenerated, ended early` : undefined);
+                metric(200, { tokensIn: usage?.promptTokens, tokensOut: usage?.completionTokens, error: runawayReason ? `runaway stream cut (${runawayReason}) — model degenerated, ended early` : undefined });
             }
             else {
-                res.json(canonicalToOpenAIResponse(await provider.complete(canon)));
-                metric(200);
+                const resp = await provider.complete(canon);
+                res.json(canonicalToOpenAIResponse(resp));
+                metric(200, { tokensIn: resp.usage?.promptTokens, tokensOut: resp.usage?.completionTokens });
             }
         }
         catch (err) {
@@ -62,7 +66,7 @@ export function mountOpenAI(app, router, onMetric) {
                 res.write(`data: ${JSON.stringify({ error: { message } })}\n\n`);
                 res.end();
             }
-            metric(status, message);
+            metric(status, { error: message });
         }
     });
     // OpenAI Responses API — Codex speaks ONLY this after codex#7782 removed wire_api="chat". Codex
@@ -73,7 +77,7 @@ export function mountOpenAI(app, router, onMetric) {
         const canon = responsesRequestToCanonical(req.body);
         canon.model = router.resolveModel(canon.model);
         const provider = router.pick(canon.model);
-        const metric = (status, error) => onMetric({ endpoint: "/openai/responses", model: canon.model, status, latencyMs: Date.now() - start, error });
+        const metric = (status, opts = {}) => onMetric({ endpoint: "/openai/responses", model: canon.model, status, latencyMs: Date.now() - start, tokensIn: opts.tokensIn, tokensOut: opts.tokensOut, error: opts.error });
         try {
             if (canon.stream) {
                 res.setHeader("content-type", "text/event-stream");
@@ -119,11 +123,12 @@ export function mountOpenAI(app, router, onMetric) {
                 for (const f of sse.finish(usage, finish, argsByIdx))
                     res.write(f);
                 res.end();
-                metric(200, runawayReason ? `runaway stream cut (${runawayReason}) — model degenerated, ended early` : undefined);
+                metric(200, { tokensIn: usage?.promptTokens, tokensOut: usage?.completionTokens, error: runawayReason ? `runaway stream cut (${runawayReason}) — model degenerated, ended early` : undefined });
             }
             else {
-                res.json(canonicalToResponsesResponse(await provider.complete(canon)));
-                metric(200);
+                const resp = await provider.complete(canon);
+                res.json(canonicalToResponsesResponse(resp));
+                metric(200, { tokensIn: resp.usage?.promptTokens, tokensOut: resp.usage?.completionTokens });
             }
         }
         catch (err) {
@@ -138,7 +143,7 @@ export function mountOpenAI(app, router, onMetric) {
                 res.write(`data: ${JSON.stringify({ type: "error", message })}\n\n`);
                 res.end();
             }
-            metric(status, message);
+            metric(status, { error: message });
         }
     });
 }

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "copilot-reverse",
-  "version": "0.5.5",
+  "version": "0.7.0",
   "description": "Interactive terminal app that exposes your GitHub Copilot subscription as local OpenAI- and Anthropic-compatible endpoints, with a self-healing daemon and a built-in assistant.",
   "type": "module",
   "license": "MIT",
@@ -32,7 +32,7 @@
     "llm"
   ],
   "scripts": {
-    "prebuild": "node scripts/gen-version.mjs",
+    "prebuild": "node scripts/gen-version.mjs && node scripts/gen-changes.mjs",
     "build": "tsc -p tsconfig.json",
     "test": "vitest run",
     "test:coverage": "vitest run --coverage",