@dianshuv/copilot-api 0.4.3 → 0.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (3)
  1. package/README.md +2 -0
  2. package/dist/main.mjs +291 -96
  3. package/package.json +2 -1
package/README.md CHANGED
@@ -15,6 +15,7 @@
15
15
  - **Graceful shutdown**: 4-phase shutdown sequence — stops accepting requests, waits for in-flight requests to complete, sends abort signal, then force-closes. Configurable via `--shutdown-graceful-wait` and `--shutdown-abort-wait`.
16
16
  - **Stream repetition detection**: Detects when models get stuck in repetitive output loops using KMP-based pattern matching and logs a warning.
17
17
  - **Stale request reaping**: Automatically force-fails requests that exceed a configurable maximum age (default 600s) to prevent resource leaks.
18
+ - **PostHog analytics**: Optional PostHog Cloud integration (`--posthog-key`) sends per-request token usage events for long-term trend analysis. Free tier (1M events/month) is more than sufficient for individual use.
18
19
 
19
20
  ## Quick Start
20
21
 
@@ -66,6 +67,7 @@ copilot-api start
66
67
  | `--redirect-anthropic` | Force Anthropic through OpenAI translation | false |
67
68
  | `--no-rewrite-anthropic-tools` | Don't rewrite server-side tools | false |
68
69
  | `--timezone-offset` | Timezone offset in hours from UTC for log timestamps (e.g., +8, -5, 0) | +8 |
70
+ | `--posthog-key` | PostHog API key for token usage analytics (opt-in) | none |
69
71
 
70
72
  ### Patch-Claude Command Options
71
73
 
package/dist/main.mjs CHANGED
@@ -4,11 +4,12 @@ import consola from "consola";
4
4
  import fs from "node:fs/promises";
5
5
  import os from "node:os";
6
6
  import path, { dirname, join } from "node:path";
7
- import { randomUUID } from "node:crypto";
7
+ import { createHash, randomUUID } from "node:crypto";
8
8
  import { existsSync, readFileSync, readdirSync, writeFileSync } from "node:fs";
9
9
  import clipboard from "clipboardy";
10
10
  import { serve } from "srvx";
11
11
  import invariant from "tiny-invariant";
12
+ import { PostHog } from "posthog-node";
12
13
  import { getProxyForUrl } from "proxy-from-env";
13
14
  import { Agent, ProxyAgent, setGlobalDispatcher } from "undici";
14
15
  import { execSync } from "node:child_process";
@@ -68,7 +69,14 @@ const EDITOR_PLUGIN_VERSION = `copilot-chat/${COPILOT_VERSION}`;
68
69
  const USER_AGENT = `GitHubCopilotChat/${COPILOT_VERSION}`;
69
70
  const API_VERSION = "2025-04-01";
70
71
  const copilotBaseUrl = (state) => state.accountType === "individual" ? "https://api.githubcopilot.com" : `https://api.${state.accountType}.githubcopilot.com`;
71
- const copilotHeaders = (state, vision = false) => {
72
+ function hasHeaderKey(headers, key) {
73
+ const lowerKey = key.toLowerCase();
74
+ return Object.keys(headers).some((existingKey) => {
75
+ return existingKey.toLowerCase() === lowerKey;
76
+ });
77
+ }
78
+ function copilotHeaders(state, visionOrOptions) {
79
+ const options = typeof visionOrOptions === "boolean" ? { vision: visionOrOptions } : visionOrOptions ?? {};
72
80
  const headers = {
73
81
  Authorization: `Bearer ${state.copilotToken}`,
74
82
  "content-type": standardHeaders()["content-type"],
@@ -76,14 +84,15 @@ const copilotHeaders = (state, vision = false) => {
76
84
  "editor-version": `vscode/${state.vsCodeVersion}`,
77
85
  "editor-plugin-version": EDITOR_PLUGIN_VERSION,
78
86
  "user-agent": USER_AGENT,
79
- "openai-intent": "conversation-panel",
87
+ "openai-intent": options.intent ?? "conversation-panel",
80
88
  "x-github-api-version": API_VERSION,
81
89
  "x-request-id": randomUUID(),
82
90
  "x-vscode-user-agent-library-version": "electron-fetch"
83
91
  };
84
- if (vision) headers["copilot-vision-request"] = "true";
92
+ for (const [key, value] of Object.entries(options.modelRequestHeaders ?? {})) if (!hasHeaderKey(headers, key)) headers[key] = value;
93
+ if (options.vision) headers["copilot-vision-request"] = "true";
85
94
  return headers;
86
- };
95
+ }
87
96
  const GITHUB_API_BASE_URL = "https://api.github.com";
88
97
  const githubHeaders = (state) => ({
89
98
  ...standardHeaders(),
@@ -208,6 +217,10 @@ function formatRateLimitError(copilotMessage) {
208
217
  }
209
218
  };
210
219
  }
220
+ function truncateForLog(text, maxLen) {
221
+ if (text.length <= maxLen) return text;
222
+ return `${text.slice(0, maxLen)}...`;
223
+ }
211
224
  function forwardError(c, error) {
212
225
  if (error instanceof HTTPError) {
213
226
  if (error.status === 413) {
@@ -246,7 +259,9 @@ function forwardError(c, error) {
246
259
  consola.warn(`HTTP 429: Rate limit exceeded`);
247
260
  return c.json(formattedError, 429);
248
261
  }
249
- consola.error(`HTTP ${error.status}:`, errorJson);
262
+ let loggedError = errorJson;
263
+ if (typeof errorJson === "string") loggedError = errorJson.trimStart().startsWith("<") ? `[HTML ${errorJson.length} bytes]` : truncateForLog(errorJson, 200);
264
+ consola.error(`HTTP ${error.status}:`, loggedError);
250
265
  return c.json({ error: {
251
266
  message: error.responseText,
252
267
  type: "error"
@@ -1021,7 +1036,7 @@ const patchClaude = defineCommand({
1021
1036
 
1022
1037
  //#endregion
1023
1038
  //#region package.json
1024
- var version = "0.4.3";
1039
+ var version = "0.6.0";
1025
1040
 
1026
1041
  //#endregion
1027
1042
  //#region src/lib/adaptive-rate-limiter.ts
@@ -1933,6 +1948,55 @@ function exportHistory(format = "json") {
1933
1948
  return [headers.join(","), ...rows.map((r) => r.join(","))].join("\n");
1934
1949
  }
1935
1950
 
1951
+ //#endregion
1952
+ //#region src/lib/posthog.ts
1953
+ let client = null;
1954
+ let distinctId = "";
1955
+ function initPostHog(apiKey) {
1956
+ if (!apiKey) return;
1957
+ try {
1958
+ client = new PostHog(apiKey, {
1959
+ host: "https://us.i.posthog.com",
1960
+ flushAt: 20,
1961
+ flushInterval: 1e4
1962
+ });
1963
+ distinctId = createHash("sha256").update(os.hostname() + os.userInfo().username).digest("hex");
1964
+ } catch (error) {
1965
+ consola.warn("Failed to initialize PostHog:", error instanceof Error ? error.message : error);
1966
+ client = null;
1967
+ }
1968
+ }
1969
+ function isPostHogEnabled() {
1970
+ return client !== null;
1971
+ }
1972
+ function captureRequest(params) {
1973
+ if (!client) return;
1974
+ const properties = {
1975
+ model: params.model,
1976
+ input_tokens: params.inputTokens,
1977
+ output_tokens: params.outputTokens,
1978
+ duration_ms: params.durationMs,
1979
+ success: params.success,
1980
+ stream: params.stream,
1981
+ tool_count: params.toolCount
1982
+ };
1983
+ if (params.reasoningTokens !== void 0) properties.reasoning_tokens = params.reasoningTokens;
1984
+ if (params.stopReason !== void 0) properties.stop_reason = params.stopReason;
1985
+ client.capture({
1986
+ distinctId,
1987
+ event: "copilot_api_request",
1988
+ properties
1989
+ });
1990
+ }
1991
+ async function shutdownPostHog() {
1992
+ if (!client) return;
1993
+ try {
1994
+ await client.shutdown();
1995
+ } catch (error) {
1996
+ consola.warn("Failed to flush PostHog events:", error instanceof Error ? error.message : error);
1997
+ }
1998
+ }
1999
+
1936
2000
  //#endregion
1937
2001
  //#region src/lib/proxy.ts
1938
2002
  /**
@@ -2143,7 +2207,7 @@ async function gracefulShutdown(signal, deps) {
2143
2207
  try {
2144
2208
  if (await drainActiveRequests(gracefulWaitMs, tracker, drainOpts) === "drained") {
2145
2209
  consola.info("All requests completed naturally");
2146
- finalize(tracker);
2210
+ await finalize(tracker);
2147
2211
  return;
2148
2212
  }
2149
2213
  } catch (error) {
@@ -2155,7 +2219,7 @@ async function gracefulShutdown(signal, deps) {
2155
2219
  try {
2156
2220
  if (await drainActiveRequests(abortWaitMs, tracker, drainOpts) === "drained") {
2157
2221
  consola.info("All requests completed after abort signal");
2158
- finalize(tracker);
2222
+ await finalize(tracker);
2159
2223
  return;
2160
2224
  }
2161
2225
  } catch (error) {
@@ -2169,13 +2233,15 @@ async function gracefulShutdown(signal, deps) {
2169
2233
  consola.error("Error force-closing server:", error);
2170
2234
  }
2171
2235
  }
2172
- finalize(tracker);
2236
+ await finalize(tracker);
2173
2237
  } else {
2238
+ await shutdownPostHog();
2174
2239
  consola.info("Shutdown complete");
2175
2240
  shutdownResolve?.();
2176
2241
  }
2177
2242
  }
2178
- function finalize(tracker) {
2243
+ async function finalize(tracker) {
2244
+ await shutdownPostHog();
2179
2245
  tracker.destroy();
2180
2246
  consola.info("Shutdown complete");
2181
2247
  shutdownResolve?.();
@@ -2465,8 +2531,10 @@ var RequestTracker = class {
2465
2531
  if (update.durationMs !== void 0) request.durationMs = update.durationMs;
2466
2532
  if (update.inputTokens !== void 0) request.inputTokens = update.inputTokens;
2467
2533
  if (update.outputTokens !== void 0) request.outputTokens = update.outputTokens;
2534
+ if (update.reasoningTokens !== void 0) request.reasoningTokens = update.reasoningTokens;
2468
2535
  if (update.error !== void 0) request.error = update.error;
2469
2536
  if (update.queuePosition !== void 0) request.queuePosition = update.queuePosition;
2537
+ if (update.queueWaitMs !== void 0) request.queueWaitMs = update.queueWaitMs;
2470
2538
  this.renderer?.onRequestUpdate(id, update);
2471
2539
  }
2472
2540
  /**
@@ -2481,6 +2549,7 @@ var RequestTracker = class {
2481
2549
  if (usage) {
2482
2550
  request.inputTokens = usage.inputTokens;
2483
2551
  request.outputTokens = usage.outputTokens;
2552
+ if (usage.reasoningTokens !== void 0) request.reasoningTokens = usage.reasoningTokens;
2484
2553
  }
2485
2554
  this.renderer?.onRequestComplete(request);
2486
2555
  this.requests.delete(id);
@@ -3281,6 +3350,26 @@ function createTruncationResponseMarkerOpenAI(result) {
3281
3350
  return `\n\n---\n[Auto-truncated: ${result.removedMessageCount} messages removed, ${result.originalTokens} → ${result.compactedTokens} tokens (${percentage}% reduction)]`;
3282
3351
  }
3283
3352
 
3353
+ //#endregion
3354
+ //#region src/lib/message-sanitizer.ts
3355
+ const startPattern = /^\s*<system-reminder>[\s\S]*?<\/system-reminder>\n*/;
3356
+ const endPatternWithNewline = /\n+<system-reminder>[\s\S]*?<\/system-reminder>\s*$/;
3357
+ const endPatternOnly = /^\s*<system-reminder>[\s\S]*?<\/system-reminder>\s*$/;
3358
+ function removeSystemReminderTags(text) {
3359
+ let result = text;
3360
+ let prev;
3361
+ do {
3362
+ prev = result;
3363
+ result = result.replace(startPattern, "");
3364
+ } while (result !== prev);
3365
+ do {
3366
+ prev = result;
3367
+ result = result.replace(endPatternWithNewline, "");
3368
+ } while (result !== prev);
3369
+ result = result.replace(endPatternOnly, "");
3370
+ return result;
3371
+ }
3372
+
3284
3373
  //#endregion
3285
3374
  //#region src/lib/repetition-detector.ts
3286
3375
  /**
@@ -3409,7 +3498,10 @@ const createChatCompletions = async (payload, options) => {
3409
3498
  const enableVision = payload.messages.some((x) => typeof x.content !== "string" && x.content?.some((x) => x.type === "image_url"));
3410
3499
  const isAgentCall = payload.messages.some((msg) => ["assistant", "tool"].includes(msg.role));
3411
3500
  const headers = {
3412
- ...copilotHeaders(state, enableVision),
3501
+ ...copilotHeaders(state, {
3502
+ vision: enableVision,
3503
+ intent: isAgentCall ? "conversation-agent" : "conversation-panel"
3504
+ }),
3413
3505
  "X-Initiator": options?.initiator ?? (isAgentCall ? "agent" : "user")
3414
3506
  };
3415
3507
  const response = await fetch(`${copilotBaseUrl(state)}/chat/completions`, {
@@ -3463,17 +3555,30 @@ function recordErrorResponse(ctx, model, error) {
3463
3555
  content: null
3464
3556
  }, Date.now() - ctx.startTime);
3465
3557
  }
3466
- /** Complete TUI tracking */
3467
- function completeTracking(trackingId, inputTokens, outputTokens, queueWaitMs) {
3558
+ /** Complete TUI tracking and send PostHog analytics */
3559
+ function completeTracking(trackingId, inputTokens, outputTokens, queueWaitMs, reasoningTokens, analytics) {
3468
3560
  if (!trackingId) return;
3469
3561
  requestTracker.updateRequest(trackingId, {
3470
3562
  inputTokens,
3471
3563
  outputTokens,
3472
- queueWaitMs
3564
+ queueWaitMs,
3565
+ reasoningTokens
3473
3566
  });
3474
3567
  requestTracker.completeRequest(trackingId, 200, {
3475
3568
  inputTokens,
3476
- outputTokens
3569
+ outputTokens,
3570
+ reasoningTokens
3571
+ });
3572
+ if (analytics) captureRequest({
3573
+ model: analytics.model,
3574
+ inputTokens,
3575
+ outputTokens,
3576
+ durationMs: analytics.durationMs,
3577
+ success: true,
3578
+ stream: analytics.stream,
3579
+ toolCount: analytics.toolCount ?? 0,
3580
+ reasoningTokens,
3581
+ stopReason: analytics.stopReason
3477
3582
  });
3478
3583
  }
3479
3584
  /** Fail TUI tracking */
@@ -3593,6 +3698,9 @@ async function logPayloadSizeInfo(payload, model) {
3593
3698
 
3594
3699
  //#endregion
3595
3700
  //#region src/routes/chat-completions/handler.ts
3701
+ function getReasoningTokensFromOpenAIUsage(usage) {
3702
+ return usage?.completion_tokens_details?.reasoning_tokens;
3703
+ }
3596
3704
  async function handleCompletion$1(c) {
3597
3705
  const originalPayload = await c.req.json();
3598
3706
  consola.debug("Request payload:", JSON.stringify(originalPayload).slice(-400));
@@ -3640,7 +3748,7 @@ async function executeRequest(opts) {
3640
3748
  try {
3641
3749
  const { result: response, queueWaitMs } = await executeWithAdaptiveRateLimit(() => createChatCompletions(payload));
3642
3750
  ctx.queueWaitMs = queueWaitMs;
3643
- if (isNonStreaming(response)) return handleNonStreamingResponse$1(c, response, ctx);
3751
+ if (isNonStreaming(response)) return handleNonStreamingResponse$1(c, response, ctx, payload);
3644
3752
  consola.debug("Streaming response");
3645
3753
  updateTrackerStatus(trackingId, "streaming");
3646
3754
  return streamSSE(c, async (stream) => {
@@ -3667,7 +3775,7 @@ async function logTokenCount(payload, selectedModel) {
3667
3775
  consola.debug("Failed to calculate token count:", error);
3668
3776
  }
3669
3777
  }
3670
- function handleNonStreamingResponse$1(c, originalResponse, ctx) {
3778
+ function handleNonStreamingResponse$1(c, originalResponse, ctx, payload) {
3671
3779
  consola.debug("Non-streaming response:", JSON.stringify(originalResponse));
3672
3780
  let response = originalResponse;
3673
3781
  if (state.verbose && ctx.truncateResult?.wasCompacted && response.choices[0]?.message.content) {
@@ -3685,21 +3793,36 @@ function handleNonStreamingResponse$1(c, originalResponse, ctx) {
3685
3793
  }
3686
3794
  const choice = response.choices[0];
3687
3795
  const usage = response.usage;
3796
+ const reasoningTokens = getReasoningTokensFromOpenAIUsage(usage);
3797
+ const durationMs = Date.now() - ctx.startTime;
3688
3798
  recordResponse(ctx.historyId, {
3689
3799
  success: true,
3690
3800
  model: response.model,
3691
3801
  usage: {
3692
3802
  input_tokens: usage?.prompt_tokens ?? 0,
3693
- output_tokens: usage?.completion_tokens ?? 0
3803
+ output_tokens: usage?.completion_tokens ?? 0,
3804
+ ...reasoningTokens !== void 0 ? { output_tokens_details: { reasoning_tokens: reasoningTokens } } : {}
3694
3805
  },
3695
3806
  stop_reason: choice.finish_reason,
3696
3807
  content: buildResponseContent(choice),
3697
3808
  toolCalls: extractToolCalls(choice)
3698
- }, Date.now() - ctx.startTime);
3809
+ }, durationMs);
3699
3810
  if (ctx.trackingId && usage) requestTracker.updateRequest(ctx.trackingId, {
3700
3811
  inputTokens: usage.prompt_tokens,
3701
3812
  outputTokens: usage.completion_tokens,
3702
- queueWaitMs: ctx.queueWaitMs
3813
+ queueWaitMs: ctx.queueWaitMs,
3814
+ reasoningTokens
3815
+ });
3816
+ captureRequest({
3817
+ model: response.model,
3818
+ inputTokens: usage?.prompt_tokens ?? 0,
3819
+ outputTokens: usage?.completion_tokens ?? 0,
3820
+ durationMs,
3821
+ success: true,
3822
+ stream: false,
3823
+ toolCount: payload.tools?.length ?? 0,
3824
+ reasoningTokens,
3825
+ stopReason: choice.finish_reason
3703
3826
  });
3704
3827
  return c.json(response);
3705
3828
  }
@@ -3729,6 +3852,7 @@ function createStreamAccumulator() {
3729
3852
  model: "",
3730
3853
  inputTokens: 0,
3731
3854
  outputTokens: 0,
3855
+ reasoningTokens: 0,
3732
3856
  finishReason: "",
3733
3857
  content: "",
3734
3858
  toolCalls: [],
@@ -3766,7 +3890,13 @@ async function handleStreamingResponse$1(opts) {
3766
3890
  await stream.writeSSE(chunk);
3767
3891
  }
3768
3892
  recordStreamSuccess(acc, payload.model, ctx);
3769
- completeTracking(ctx.trackingId, acc.inputTokens, acc.outputTokens, ctx.queueWaitMs);
3893
+ completeTracking(ctx.trackingId, acc.inputTokens, acc.outputTokens, ctx.queueWaitMs, acc.reasoningTokens, {
3894
+ model: acc.model || payload.model,
3895
+ stream: true,
3896
+ durationMs: Date.now() - ctx.startTime,
3897
+ stopReason: acc.finishReason || void 0,
3898
+ toolCount: payload.tools?.length ?? 0
3899
+ });
3770
3900
  } catch (error) {
3771
3901
  recordStreamError({
3772
3902
  acc,
@@ -3786,6 +3916,7 @@ function parseStreamChunk(chunk, acc, checkRepetition) {
3786
3916
  if (parsed.usage) {
3787
3917
  acc.inputTokens = parsed.usage.prompt_tokens;
3788
3918
  acc.outputTokens = parsed.usage.completion_tokens;
3919
+ acc.reasoningTokens = getReasoningTokensFromOpenAIUsage(parsed.usage) ?? 0;
3789
3920
  }
3790
3921
  const choice = parsed.choices[0];
3791
3922
  if (choice) {
@@ -3826,7 +3957,8 @@ function recordStreamSuccess(acc, fallbackModel, ctx) {
3826
3957
  model: acc.model || fallbackModel,
3827
3958
  usage: {
3828
3959
  input_tokens: acc.inputTokens,
3829
- output_tokens: acc.outputTokens
3960
+ output_tokens: acc.outputTokens,
3961
+ ...acc.reasoningTokens > 0 ? { output_tokens_details: { reasoning_tokens: acc.reasoningTokens } } : {}
3830
3962
  },
3831
3963
  stop_reason: acc.finishReason || void 0,
3832
3964
  content: {
@@ -3845,7 +3977,7 @@ function convertOpenAIMessages(messages) {
3845
3977
  return messages.map((msg) => {
3846
3978
  const result = {
3847
3979
  role: msg.role,
3848
- content: typeof msg.content === "string" ? msg.content : JSON.stringify(msg.content)
3980
+ content: typeof msg.content === "string" ? removeSystemReminderTags(msg.content) : JSON.stringify(msg.content)
3849
3981
  };
3850
3982
  if ("tool_calls" in msg && msg.tool_calls) result.tool_calls = msg.tool_calls.map((tc) => ({
3851
3983
  id: tc.id,
@@ -6006,7 +6138,10 @@ async function createAnthropicMessages(payload, options) {
6006
6138
  });
6007
6139
  const isAgentCall = filteredPayload.messages.some((msg) => msg.role === "assistant");
6008
6140
  const headers = {
6009
- ...copilotHeaders(state, enableVision),
6141
+ ...copilotHeaders(state, {
6142
+ vision: enableVision,
6143
+ intent: isAgentCall ? "conversation-agent" : "conversation-panel"
6144
+ }),
6010
6145
  "X-Initiator": options?.initiator ?? (isAgentCall ? "agent" : "user"),
6011
6146
  "anthropic-version": "2023-06-01"
6012
6147
  };
@@ -6141,12 +6276,12 @@ function convertAnthropicMessages(messages) {
6141
6276
  return messages.map((msg) => {
6142
6277
  if (typeof msg.content === "string") return {
6143
6278
  role: msg.role,
6144
- content: msg.content
6279
+ content: removeSystemReminderTags(msg.content)
6145
6280
  };
6146
6281
  const content = msg.content.map((block) => {
6147
6282
  if (block.type === "text") return {
6148
6283
  type: "text",
6149
- text: block.text
6284
+ text: removeSystemReminderTags(block.text)
6150
6285
  };
6151
6286
  if (block.type === "tool_use") return {
6152
6287
  type: "tool_use",
@@ -6213,9 +6348,13 @@ function createAnthropicStreamAccumulator() {
6213
6348
  stopReason: "",
6214
6349
  content: "",
6215
6350
  toolCalls: [],
6351
+ serverToolResults: [],
6216
6352
  currentToolCall: null
6217
6353
  };
6218
6354
  }
6355
+ function isServerToolResultType(type) {
6356
+ return type !== "tool_result" && type.endsWith("_tool_result");
6357
+ }
6219
6358
  function processAnthropicEvent(event, acc) {
6220
6359
  switch (event.type) {
6221
6360
  case "content_block_delta":
@@ -6238,11 +6377,14 @@ function handleContentBlockDelta(delta, acc) {
6238
6377
  else if (delta.type === "input_json_delta" && acc.currentToolCall) acc.currentToolCall.input += delta.partial_json;
6239
6378
  }
6240
6379
  function handleContentBlockStart(block, acc) {
6241
- if (block.type === "tool_use") acc.currentToolCall = {
6242
- id: block.id,
6243
- name: block.name,
6244
- input: ""
6245
- };
6380
+ if (block.type === "tool_use") {
6381
+ const toolBlock = block;
6382
+ acc.currentToolCall = {
6383
+ id: toolBlock.id,
6384
+ name: toolBlock.name,
6385
+ input: ""
6386
+ };
6387
+ } else if (isServerToolResultType(block.type)) acc.serverToolResults.push(block);
6246
6388
  }
6247
6389
  function handleContentBlockStop(acc) {
6248
6390
  if (acc.currentToolCall) {
@@ -6257,6 +6399,32 @@ function handleMessageDelta(delta, usage, acc) {
6257
6399
  acc.outputTokens = usage.output_tokens;
6258
6400
  }
6259
6401
  }
6402
+ function recordAnthropicStreamingResponse(acc, fallbackModel, ctx) {
6403
+ const contentBlocks = [];
6404
+ if (acc.content) contentBlocks.push({
6405
+ type: "text",
6406
+ text: acc.content
6407
+ });
6408
+ for (const tc of acc.toolCalls) contentBlocks.push({
6409
+ type: "tool_use",
6410
+ ...tc
6411
+ });
6412
+ for (const result of acc.serverToolResults) contentBlocks.push(result);
6413
+ recordResponse(ctx.historyId, {
6414
+ success: true,
6415
+ model: acc.model || fallbackModel,
6416
+ usage: {
6417
+ input_tokens: acc.inputTokens,
6418
+ output_tokens: acc.outputTokens
6419
+ },
6420
+ stop_reason: acc.stopReason || void 0,
6421
+ content: contentBlocks.length > 0 ? {
6422
+ role: "assistant",
6423
+ content: contentBlocks
6424
+ } : null,
6425
+ toolCalls: acc.toolCalls.length > 0 ? acc.toolCalls : void 0
6426
+ }, Date.now() - ctx.startTime);
6427
+ }
6260
6428
 
6261
6429
  //#endregion
6262
6430
  //#region src/routes/messages/non-stream-translation.ts
@@ -6762,7 +6930,7 @@ async function handleDirectAnthropicCompletion(c, anthropicPayload, ctx, initiat
6762
6930
  });
6763
6931
  });
6764
6932
  }
6765
- return handleDirectAnthropicNonStreamingResponse(c, response, ctx, truncateResult);
6933
+ return handleDirectAnthropicNonStreamingResponse(c, response, ctx, truncateResult, effectivePayload);
6766
6934
  } catch (error) {
6767
6935
  if (error instanceof HTTPError && error.status === 413) logPayloadSizeInfoAnthropic(effectivePayload, selectedModel);
6768
6936
  recordErrorResponse(ctx, anthropicPayload.model, error);
@@ -6787,7 +6955,7 @@ function logPayloadSizeInfoAnthropic(payload, model) {
6787
6955
  /**
6788
6956
  * Handle non-streaming direct Anthropic response
6789
6957
  */
6790
- function handleDirectAnthropicNonStreamingResponse(c, response, ctx, truncateResult) {
6958
+ function handleDirectAnthropicNonStreamingResponse(c, response, ctx, truncateResult, payload) {
6791
6959
  consola.debug("Non-streaming response from Copilot (direct Anthropic):", JSON.stringify(response).slice(-400));
6792
6960
  recordResponse(ctx.historyId, {
6793
6961
  success: true,
@@ -6823,6 +6991,16 @@ function handleDirectAnthropicNonStreamingResponse(c, response, ctx, truncateRes
6823
6991
  outputTokens: response.usage.output_tokens,
6824
6992
  queueWaitMs: ctx.queueWaitMs
6825
6993
  });
6994
+ captureRequest({
6995
+ model: response.model,
6996
+ inputTokens: response.usage.input_tokens,
6997
+ outputTokens: response.usage.output_tokens,
6998
+ durationMs: Date.now() - ctx.startTime,
6999
+ success: true,
7000
+ stream: false,
7001
+ toolCount: payload.tools?.length ?? 0,
7002
+ stopReason: response.stop_reason ?? void 0
7003
+ });
6826
7004
  let finalResponse = response;
6827
7005
  if (state.verbose && truncateResult?.wasCompacted) finalResponse = prependMarkerToAnthropicResponse$1(response, createTruncationMarker$1(truncateResult));
6828
7006
  return c.json(finalResponse);
@@ -6875,8 +7053,14 @@ async function handleDirectAnthropicStreamingResponse(opts) {
6875
7053
  data: rawEvent.data
6876
7054
  });
6877
7055
  }
6878
- recordStreamingResponse$1(acc, anthropicPayload.model, ctx);
6879
- completeTracking(ctx.trackingId, acc.inputTokens, acc.outputTokens, ctx.queueWaitMs);
7056
+ recordAnthropicStreamingResponse(acc, anthropicPayload.model, ctx);
7057
+ completeTracking(ctx.trackingId, acc.inputTokens, acc.outputTokens, ctx.queueWaitMs, void 0, {
7058
+ model: acc.model || anthropicPayload.model,
7059
+ stream: true,
7060
+ durationMs: Date.now() - ctx.startTime,
7061
+ stopReason: acc.stopReason || void 0,
7062
+ toolCount: anthropicPayload.tools?.length ?? 0
7063
+ });
6880
7064
  } catch (error) {
6881
7065
  consola.error("Direct Anthropic stream error:", error);
6882
7066
  recordStreamError({
@@ -6893,31 +7077,6 @@ async function handleDirectAnthropicStreamingResponse(opts) {
6893
7077
  });
6894
7078
  }
6895
7079
  }
6896
- function recordStreamingResponse$1(acc, fallbackModel, ctx) {
6897
- const contentBlocks = [];
6898
- if (acc.content) contentBlocks.push({
6899
- type: "text",
6900
- text: acc.content
6901
- });
6902
- for (const tc of acc.toolCalls) contentBlocks.push({
6903
- type: "tool_use",
6904
- ...tc
6905
- });
6906
- recordResponse(ctx.historyId, {
6907
- success: true,
6908
- model: acc.model || fallbackModel,
6909
- usage: {
6910
- input_tokens: acc.inputTokens,
6911
- output_tokens: acc.outputTokens
6912
- },
6913
- stop_reason: acc.stopReason || void 0,
6914
- content: contentBlocks.length > 0 ? {
6915
- role: "assistant",
6916
- content: contentBlocks
6917
- } : null,
6918
- toolCalls: acc.toolCalls.length > 0 ? acc.toolCalls : void 0
6919
- }, Date.now() - ctx.startTime);
6920
- }
6921
7080
 
6922
7081
  //#endregion
6923
7082
  //#region src/routes/messages/subagent-marker.ts
@@ -6984,7 +7143,8 @@ async function handleTranslatedCompletion(c, anthropicPayload, ctx, initiatorOve
6984
7143
  c,
6985
7144
  response,
6986
7145
  toolNameMapping,
6987
- ctx
7146
+ ctx,
7147
+ anthropicPayload
6988
7148
  });
6989
7149
  consola.debug("Streaming response from Copilot");
6990
7150
  updateTrackerStatus(ctx.trackingId, "streaming");
@@ -7004,7 +7164,7 @@ async function handleTranslatedCompletion(c, anthropicPayload, ctx, initiatorOve
7004
7164
  }
7005
7165
  }
7006
7166
  function handleNonStreamingResponse(opts) {
7007
- const { c, response, toolNameMapping, ctx } = opts;
7167
+ const { c, response, toolNameMapping, ctx, anthropicPayload } = opts;
7008
7168
  consola.debug("Non-streaming response from Copilot:", JSON.stringify(response).slice(-400));
7009
7169
  let anthropicResponse = translateToAnthropic(response, toolNameMapping);
7010
7170
  consola.debug("Translated Anthropic response:", JSON.stringify(anthropicResponse));
@@ -7040,6 +7200,16 @@ function handleNonStreamingResponse(opts) {
7040
7200
  outputTokens: anthropicResponse.usage.output_tokens,
7041
7201
  queueWaitMs: ctx.queueWaitMs
7042
7202
  });
7203
+ captureRequest({
7204
+ model: anthropicResponse.model,
7205
+ inputTokens: anthropicResponse.usage.input_tokens,
7206
+ outputTokens: anthropicResponse.usage.output_tokens,
7207
+ durationMs: Date.now() - ctx.startTime,
7208
+ success: true,
7209
+ stream: false,
7210
+ toolCount: anthropicPayload.tools?.length ?? 0,
7211
+ stopReason: anthropicResponse.stop_reason ?? void 0
7212
+ });
7043
7213
  return c.json(anthropicResponse);
7044
7214
  }
7045
7215
  function prependMarkerToAnthropicResponse(response, marker) {
@@ -7084,8 +7254,14 @@ async function handleStreamingResponse(opts) {
7084
7254
  acc,
7085
7255
  checkRepetition
7086
7256
  });
7087
- recordStreamingResponse(acc, anthropicPayload.model, ctx);
7088
- completeTracking(ctx.trackingId, acc.inputTokens, acc.outputTokens, ctx.queueWaitMs);
7257
+ recordAnthropicStreamingResponse(acc, anthropicPayload.model, ctx);
7258
+ completeTracking(ctx.trackingId, acc.inputTokens, acc.outputTokens, ctx.queueWaitMs, void 0, {
7259
+ model: acc.model || anthropicPayload.model,
7260
+ stream: true,
7261
+ durationMs: Date.now() - ctx.startTime,
7262
+ stopReason: acc.stopReason || void 0,
7263
+ toolCount: anthropicPayload.tools?.length ?? 0
7264
+ });
7089
7265
  } catch (error) {
7090
7266
  consola.error("Stream error:", error);
7091
7267
  recordStreamError({
@@ -7163,31 +7339,6 @@ async function processStreamChunks(opts) {
7163
7339
  }
7164
7340
  }
7165
7341
  }
7166
- function recordStreamingResponse(acc, fallbackModel, ctx) {
7167
- const contentBlocks = [];
7168
- if (acc.content) contentBlocks.push({
7169
- type: "text",
7170
- text: acc.content
7171
- });
7172
- for (const tc of acc.toolCalls) contentBlocks.push({
7173
- type: "tool_use",
7174
- ...tc
7175
- });
7176
- recordResponse(ctx.historyId, {
7177
- success: true,
7178
- model: acc.model || fallbackModel,
7179
- usage: {
7180
- input_tokens: acc.inputTokens,
7181
- output_tokens: acc.outputTokens
7182
- },
7183
- stop_reason: acc.stopReason || void 0,
7184
- content: contentBlocks.length > 0 ? {
7185
- role: "assistant",
7186
- content: contentBlocks
7187
- } : null,
7188
- toolCalls: acc.toolCalls.length > 0 ? acc.toolCalls : void 0
7189
- }, Date.now() - ctx.startTime);
7190
- }
7191
7342
 
7192
7343
  //#endregion
7193
7344
  //#region src/routes/messages/handler.ts
@@ -7361,7 +7512,7 @@ modelRoutes.get("/", async (c) => {
7361
7512
  const createResponses = async (payload, { vision, initiator }) => {
7362
7513
  if (!state.copilotToken) throw new Error("Copilot token not found");
7363
7514
  const headers = {
7364
- ...copilotHeaders(state, vision),
7515
+ ...copilotHeaders(state, { vision }),
7365
7516
  "X-Initiator": initiator
7366
7517
  };
7367
7518
  payload.service_tier = null;
@@ -7633,7 +7784,12 @@ const handleResponses = async (c) => {
7633
7784
  if (finalResult) {
7634
7785
  recordResponseResult(finalResult, model, historyId, startTime);
7635
7786
  const usage = finalResult.usage;
7636
- completeTracking(trackingId, usage?.input_tokens ?? 0, usage?.output_tokens ?? 0, queueWaitMs);
7787
+ completeTracking(trackingId, usage?.input_tokens ?? 0, usage?.output_tokens ?? 0, queueWaitMs, usage?.output_tokens_details?.reasoning_tokens, {
7788
+ model: finalResult.model || model,
7789
+ stream: true,
7790
+ durationMs: Date.now() - startTime,
7791
+ toolCount: tools.length
7792
+ });
7637
7793
  } else if (streamErrorMessage) {
7638
7794
  recordResponse(historyId, {
7639
7795
  success: false,
@@ -7662,7 +7818,12 @@ const handleResponses = async (c) => {
7662
7818
  const result = response;
7663
7819
  const usage = result.usage;
7664
7820
  recordResponseResult(result, model, historyId, startTime);
7665
- completeTracking(trackingId, usage?.input_tokens ?? 0, usage?.output_tokens ?? 0, ctx.queueWaitMs);
7821
+ completeTracking(trackingId, usage?.input_tokens ?? 0, usage?.output_tokens ?? 0, ctx.queueWaitMs, usage?.output_tokens_details?.reasoning_tokens, {
7822
+ model: result.model || model,
7823
+ stream: false,
7824
+ durationMs: Date.now() - startTime,
7825
+ toolCount: tools.length
7826
+ });
7666
7827
  consola.debug("Forwarding native Responses result:", JSON.stringify(result).slice(-400));
7667
7828
  return c.json(result);
7668
7829
  } catch (error) {
@@ -7713,7 +7874,8 @@ function recordResponseResult(result, fallbackModel, historyId, startTime) {
7713
7874
  model: result.model || fallbackModel,
7714
7875
  usage: {
7715
7876
  input_tokens: usage?.input_tokens ?? 0,
7716
- output_tokens: usage?.output_tokens ?? 0
7877
+ output_tokens: usage?.output_tokens ?? 0,
7878
+ ...usage?.output_tokens_details ? { output_tokens_details: { reasoning_tokens: usage.output_tokens_details.reasoning_tokens } } : {}
7717
7879
  },
7718
7880
  stop_reason: extractResponseStopReason(result),
7719
7881
  content,
@@ -7788,6 +7950,18 @@ server.route("/history", historyRoutes);
7788
7950
 
7789
7951
  //#endregion
7790
7952
  //#region src/start.ts
7953
+ const VALID_ACCOUNT_TYPES = [
7954
+ "individual",
7955
+ "business",
7956
+ "enterprise"
7957
+ ];
7958
+ function isValidAccountType(accountType) {
7959
+ return VALID_ACCOUNT_TYPES.includes(accountType);
7960
+ }
7961
+ function validateAccountType(accountType) {
7962
+ if (isValidAccountType(accountType)) return;
7963
+ throw new Error(`Invalid account type: "${accountType}". Available: ${VALID_ACCOUNT_TYPES.join(", ")}`);
7964
+ }
7791
7965
  /** Format limit values as "Xk" or "?" if not available */
7792
7966
  function formatLimit(value) {
7793
7967
  return value ? `${Math.round(value / 1e3)}k` : "?";
@@ -7810,6 +7984,12 @@ async function runServer(options) {
7810
7984
  state.verbose = true;
7811
7985
  }
7812
7986
  state.accountType = options.accountType;
7987
+ try {
7988
+ validateAccountType(state.accountType);
7989
+ } catch (error) {
7990
+ consola.error(error instanceof Error ? error.message : String(error));
7991
+ process.exit(1);
7992
+ }
7813
7993
  if (options.accountType !== "individual") consola.info(`Using ${options.accountType} plan GitHub account`);
7814
7994
  state.manualApprove = options.manual;
7815
7995
  state.showToken = options.showToken;
@@ -7834,6 +8014,10 @@ async function runServer(options) {
7834
8014
  const limitText = options.historyLimit === 0 ? "unlimited" : `max ${options.historyLimit}`;
7835
8015
  consola.info(`History recording enabled (${limitText} entries)`);
7836
8016
  }
8017
+ if (options.posthogKey) {
8018
+ initPostHog(options.posthogKey);
8019
+ if (isPostHogEnabled()) consola.info("PostHog analytics enabled");
8020
+ }
7837
8021
  initTui({ enabled: true });
7838
8022
  initRequestContextManager(state.staleRequestMaxAge).startReaper();
7839
8023
  await ensurePaths();
@@ -7843,7 +8027,13 @@ async function runServer(options) {
7843
8027
  consola.info("Using provided GitHub token");
7844
8028
  } else await setupGitHubToken();
7845
8029
  await setupCopilotToken();
7846
- await cacheModels();
8030
+ try {
8031
+ await cacheModels();
8032
+ } catch (error) {
8033
+ consola.error(`Failed to fetch available models for account type "${state.accountType}". Check that the account type matches your Copilot plan.`);
8034
+ consola.error(error instanceof Error ? error.message : String(error));
8035
+ process.exit(1);
8036
+ }
7847
8037
  consola.info(`Available models:\n${state.models?.data.map((m) => formatModelInfo(m)).join("\n")}`);
7848
8038
  const serverUrl = `http://${options.host ?? "localhost"}:${options.port}`;
7849
8039
  if (options.claudeCode) {
@@ -8002,6 +8192,10 @@ const start = defineCommand({
8002
8192
  type: "string",
8003
8193
  default: "+8",
8004
8194
  description: "Timezone offset in hours from UTC for log timestamps (e.g., +8, -5, 0)"
8195
+ },
8196
+ "posthog-key": {
8197
+ type: "string",
8198
+ description: "PostHog API key for token usage analytics (opt-in, no key = disabled)"
8005
8199
  }
8006
8200
  },
8007
8201
  run({ args }) {
@@ -8026,7 +8220,8 @@ const start = defineCommand({
8026
8220
  compressToolResults: args["compress-tool-results"],
8027
8221
  redirectAnthropic: args["redirect-anthropic"],
8028
8222
  rewriteAnthropicTools: !args["no-rewrite-anthropic-tools"],
8029
- timezoneOffset: parseTimezoneOffset(args["timezone-offset"])
8223
+ timezoneOffset: parseTimezoneOffset(args["timezone-offset"]),
8224
+ posthogKey: args["posthog-key"]
8030
8225
  });
8031
8226
  }
8032
8227
  });
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@dianshuv/copilot-api",
3
- "version": "0.4.3",
3
+ "version": "0.6.0",
4
4
  "description": "Turn GitHub Copilot into OpenAI/Anthropic API compatible server. Usable with Claude Code!",
5
5
  "author": "dianshuv",
6
6
  "type": "module",
@@ -41,6 +41,7 @@
41
41
  "gpt-tokenizer": "^3.4.0",
42
42
  "hono": "^4.11.7",
43
43
  "picocolors": "^1.1.1",
44
+ "posthog-node": "^5.28.6",
44
45
  "proxy-from-env": "^1.1.0",
45
46
  "srvx": "^0.10.1",
46
47
  "tiny-invariant": "^1.3.3",