@agi-cli/server 0.1.111 → 0.1.112

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/package.json CHANGED
@@ -1,6 +1,6 @@
 {
   "name": "@agi-cli/server",
-  "version": "0.1.111",
+  "version": "0.1.112",
   "description": "HTTP API server for AGI CLI",
   "type": "module",
   "main": "./src/index.ts",
@@ -29,8 +29,8 @@
     "typecheck": "tsc --noEmit"
   },
   "dependencies": {
-    "@agi-cli/sdk": "0.1.111",
-    "@agi-cli/database": "0.1.111",
+    "@agi-cli/sdk": "0.1.112",
+    "@agi-cli/database": "0.1.112",
     "drizzle-orm": "^0.44.5",
     "hono": "^4.9.9",
     "zod": "^4.1.8"
@@ -173,10 +173,9 @@ export async function updateMessageTokensIncremental(
       ? Number(providerMetadata.openai.cachedPromptTokens)
       : priorCached;
 
-  const cumTotal =
-    usage.totalTokens != null
-      ? Number(usage.totalTokens)
-      : cumPrompt + cumCompletion + cumReasoning;
+  // Note: AI SDK's totalTokens excludes cachedInputTokens for Anthropic,
+  // so we always compute total ourselves to include all token types.
+  const cumTotal = cumPrompt + cumCompletion + cumCached + cumReasoning;
 
   await db
     .update(messages)
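
The new accumulation sums the four usage buckets directly instead of trusting the SDK-reported total. A minimal standalone sketch of the idea (the helper name and parameter shape below are hypothetical, not part of the package):

    // Sum every bucket ourselves: with Anthropic, the AI SDK's
    // usage.totalTokens omits cachedInputTokens, so relying on the
    // reported total would undercount cached prompt reads.
    function sumTokenBuckets(buckets: {
      prompt: number;
      completion: number;
      cached: number;
      reasoning: number;
    }): number {
      return buckets.prompt + buckets.completion + buckets.cached + buckets.reasoning;
    }

    // e.g. sumTokenBuckets({ prompt: 1200, completion: 300, cached: 800, reasoning: 0 }) === 2300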
@@ -7,7 +7,7 @@ import { publish } from '../events/bus.ts';
 import { enqueueAssistantRun } from './session-queue.ts';
 import { runSessionLoop } from './runner.ts';
 import { resolveModel } from './provider.ts';
-import type { ProviderId } from '@agi-cli/sdk';
+import { getFastModel, type ProviderId } from '@agi-cli/sdk';
 import { debugLog } from './debug.ts';
 
 type SessionRow = typeof sessions.$inferSelect;
@@ -230,8 +230,6 @@ async function generateSessionTitle(args: {
   debugLog('[TITLE_GEN] Generating title for session');
   debugLog(`[TITLE_GEN] Provider: ${provider}, Model: ${modelName}`);
 
-  const model = await resolveModel(provider, modelName, cfg);
-
   const { getAuth } = await import('@agi-cli/sdk');
   const { getProviderSpoofPrompt } = await import('./prompt.ts');
   const auth = await getAuth(provider, cfg.projectRoot);
@@ -240,6 +238,12 @@ async function generateSessionTitle(args: {
     ? getProviderSpoofPrompt(provider)
     : undefined;
 
+  // Use a smaller, faster model for title generation
+  // Look up the cheapest/fastest model from the catalog for this provider
+  const titleModel = getFastModel(provider) ?? modelName;
+  debugLog(`[TITLE_GEN] Using title model: ${titleModel}`);
+  const model = await resolveModel(provider, titleModel, cfg);
+
   debugLog(
     `[TITLE_GEN] needsSpoof: ${needsSpoof}, spoofPrompt: ${spoofPrompt || 'NONE'}`,
   );
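
The intent of the new block is to prefer the provider's catalogued fast model for the cheap title-generation call and fall back to the session's own model when the catalog has no entry. A rough sketch, assuming getFastModel returns string | undefined (its exact signature is not shown in this diff):

    // Hypothetical condensed view of the new selection order.
    function pickTitleModel(
      fastModel: string | undefined, // result of getFastModel(provider), assumed
      sessionModel: string,
    ): string {
      return fastModel ?? sessionModel;
    }

    // pickTitleModel('fast-model', 'session-model') === 'fast-model'
    // pickTitleModel(undefined, 'session-model') === 'session-model'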
@@ -2,6 +2,7 @@ import type { AGIConfig, ProviderId } from '@agi-cli/sdk';
 import {
   catalog,
   createSolforgeModel,
+  createOpenAIOAuthModel,
   getAuth,
   refreshToken,
   setAuth,
@@ -437,7 +438,23 @@ export async function resolveModel(
   model: string,
   cfg: AGIConfig,
 ) {
-  if (provider === 'openai') return openai(model);
+  if (provider === 'openai') {
+    const auth = await getAuth('openai', cfg.projectRoot);
+    if (auth?.type === 'oauth') {
+      const isCodexModel = model.toLowerCase().includes('codex');
+      return createOpenAIOAuthModel(model, {
+        oauth: auth,
+        projectRoot: cfg.projectRoot,
+        reasoningEffort: isCodexModel ? 'high' : 'medium',
+        reasoningSummary: 'auto',
+      });
+    }
+    if (auth?.type === 'api' && auth.key) {
+      const instance = createOpenAI({ apiKey: auth.key });
+      return instance(model);
+    }
+    return openai(model);
+  }
   if (provider === 'anthropic') {
     const instance = await getAnthropicInstance(cfg);
     return instance(model);
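
The rewritten OpenAI branch resolves credentials in order: OAuth first (with higher reasoning effort for codex-style models), then a stored API key, then the default environment-based client. A self-contained sketch of just that ordering; the auth shape below is assumed from the calls visible in the diff, and the real code returns model instances rather than labels:

    type OpenAIAuth =
      | { type: 'oauth' }
      | { type: 'api'; key?: string }
      | undefined;

    // Reports which path resolveModel would take for a given auth record.
    function openAIPath(auth: OpenAIAuth): 'oauth' | 'api-key' | 'env-default' {
      if (auth?.type === 'oauth') return 'oauth';              // createOpenAIOAuthModel(...)
      if (auth?.type === 'api' && auth.key) return 'api-key';  // createOpenAI({ apiKey })
      return 'env-default';                                    // openai(model)
    }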
@@ -1,5 +1,5 @@
 import { hasToolCall, streamText } from 'ai';
-import { loadConfig, getAuth } from '@agi-cli/sdk';
+import { loadConfig } from '@agi-cli/sdk';
 import { getDb } from '@agi-cli/database';
 import { messageParts } from '@agi-cli/database/schema';
 import { eq } from 'drizzle-orm';
@@ -178,7 +178,10 @@ async function runAssistant(opts: RunOpts) {
 
   // FIX: For OAuth, ALWAYS prepend the system message because it's never in history
   // For API key mode, only add on first message (when additionalSystemMessages is empty)
-  const messagesWithSystemInstructions: any[] = [
+  const messagesWithSystemInstructions: Array<{
+    role: string;
+    content: string | Array<unknown>;
+  }> = [
     ...additionalSystemMessages, // Always add for OAuth, empty for API key mode
     ...history,
   ];
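
Here the loose any[] annotation becomes a structural type, so the composed prompt keeps its role and content shapes visible to the type checker. A minimal illustration of values that satisfy the new type (the sample messages are hypothetical):

    type LoosePromptMessage = {
      role: string;
      content: string | Array<unknown>;
    };

    // Both plain-text and multi-part content remain assignable.
    const sample: LoosePromptMessage[] = [
      { role: 'system', content: 'You are a coding assistant.' },
      { role: 'user', content: [{ type: 'text', text: 'Summarize the diff.' }] },
    ];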