npm - @agi-cli/server - Versions diffs - 0.1.58 → 0.1.61 - Mend

@agi-cli/server 0.1.58 → 0.1.61

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (12)

package/package.json +3 -3
package/src/index.ts +1 -1
package/src/openapi/spec.ts +641 -0
package/src/runtime/agent-registry.ts +3 -2
package/src/runtime/cache-optimizer.ts +93 -0
package/src/runtime/context-optimizer.ts +206 -0
package/src/runtime/db-operations.ts +173 -39
package/src/runtime/history-truncator.ts +26 -0
package/src/runtime/runner.ts +116 -240
package/src/runtime/session-manager.ts +2 -0
package/src/runtime/stream-handlers.ts +199 -184
package/src/tools/adapter.ts +261 -173

package/src/runtime/runner.ts CHANGED

@@ -1,4 +1,4 @@
-import { hasToolCall, streamText } from 'ai';
+import { streamText } from 'ai';
 import { loadConfig } from '@agi-cli/sdk';
 import { getDb } from '@agi-cli/database';
 import { messageParts } from '@agi-cli/database/schema';
@@ -7,11 +7,8 @@ import { resolveModel } from './provider.ts';
 import { resolveAgentConfig } from './agent-registry.ts';
 import { composeSystemPrompt } from './prompt.ts';
 import { discoverProjectTools } from '@agi-cli/sdk';
-import { adaptTools } from '../tools/adapter.ts';
-import { publish, subscribe } from '../events/bus.ts';
-import { debugLog, time } from './debug.ts';
+import { publish } from '../events/bus.ts';
 import { buildHistoryMessages } from './history-builder.ts';
-import { toErrorPayload } from './error-handling.ts';
 import { getMaxOutputTokens } from './token-utils.ts';
 import {
 	type RunOpts,
@@ -22,14 +19,11 @@ import {
 	dequeueJob,
 	cleanupSession,
 } from './session-queue.ts';
+import { setupToolContext } from './tool-context-setup.ts';
 import {
-	setupToolContext,
-	type RunnerToolContext,
-} from './tool-context-setup.ts';
-import {
-	updateSessionTokens,
+	updateSessionTokensIncremental,
+	updateMessageTokensIncremental,
 	completeAssistantMessage,
-	cleanupEmptyTextParts,
 } from './db-operations.ts';
 import {
 	createStepFinishHandler,
@@ -37,175 +31,38 @@ import {
 	createAbortHandler,
 	createFinishHandler,
 } from './stream-handlers.ts';
+import { addCacheControl } from './cache-optimizer.ts';
+import { optimizeContext } from './context-optimizer.ts';
+import { truncateHistory } from './history-truncator.ts';
 /**
- * Enqueues an assistant run for processing.
- */
-export function enqueueAssistantRun(opts: Omit<RunOpts, 'abortSignal'>) {
-	enqueueRun(opts, processQueue);
-}
-/**
- * Aborts an active session.
+ * Main runner that executes the LLM streaming loop with tools
  */
-export function abortSession(sessionId: string) {
-	abortSessionQueue(sessionId);
-}
-/**
- * Processes the queue of assistant runs for a session.
- */
-async function processQueue(sessionId: string) {
-	const state = getRunnerState(sessionId);
-	if (!state) return;
-	if (state.running) return;
-	setRunning(sessionId, true);
-	while (state.queue.length > 0) {
-		const job = dequeueJob(sessionId);
-		if (!job) break;
-		try {
-			await runAssistant(job);
-		} catch (_err) {
-			// Swallow to keep the loop alive; event published by runner
-		}
-	}
-	setRunning(sessionId, false);
-	cleanupSession(sessionId);
-}
-/**
- * Ensures the finish tool is called if not already observed.
- */
-async function ensureFinishToolCalled(
-	finishObserved: boolean,
-	toolset: ReturnType<typeof adaptTools>,
-	sharedCtx: RunnerToolContext,
-	stepIndex: number,
-) {
-	if (finishObserved || !toolset?.finish?.execute) return;
-	const finishInput = {} as const;
-	const callOptions = { input: finishInput } as const;
-	sharedCtx.stepIndex = stepIndex;
-	try {
-		await toolset.finish.onInputStart?.(callOptions as never);
-	} catch {}
-	try {
-		await toolset.finish.onInputAvailable?.(callOptions as never);
-	} catch {}
-	await toolset.finish.execute(finishInput, {} as never);
-}
-/**
- * Main function to run the assistant for a given request.
- */
-async function runAssistant(opts: RunOpts) {
-	const cfgTimer = time('runner:loadConfig+db');
-	const cfg = await loadConfig(opts.projectRoot);
-	const db = await getDb(cfg.projectRoot);
-	cfgTimer.end();
-	const agentTimer = time('runner:resolveAgentConfig');
-	const agentCfg = await resolveAgentConfig(cfg.projectRoot, opts.agent);
-	agentTimer.end({ agent: opts.agent });
-	const agentPrompt = agentCfg.prompt || '';
-	const historyTimer = time('runner:buildHistory');
-	const history = await buildHistoryMessages(db, opts.sessionId);
-	historyTimer.end({ messages: history.length });
-	const isFirstMessage = history.length === 0;
-	const systemTimer = time('runner:composeSystemPrompt');
-	const { getAuth } = await import('@agi-cli/sdk');
-	const { getProviderSpoofPrompt } = await import('./prompt.ts');
-	const auth = await getAuth(opts.provider, cfg.projectRoot);
-	const needsSpoof = auth?.type === 'oauth';
-	const spoofPrompt = needsSpoof
-		? getProviderSpoofPrompt(opts.provider)
-		: undefined;
-	let system: string;
-	let additionalSystemMessages: Array<{ role: 'system'; content: string }> = [];
-	if (spoofPrompt) {
-		system = spoofPrompt;
-		const fullPrompt = await composeSystemPrompt({
-			provider: opts.provider,
-			model: opts.model,
-			projectRoot: cfg.projectRoot,
-			agentPrompt,
-			oneShot: opts.oneShot,
-			spoofPrompt: undefined,
-			includeProjectTree: isFirstMessage,
-		});
-		additionalSystemMessages = [{ role: 'system', content: fullPrompt }];
-	} else {
-		system = await composeSystemPrompt({
-			provider: opts.provider,
-			model: opts.model,
-			projectRoot: cfg.projectRoot,
-			agentPrompt,
-			oneShot: opts.oneShot,
-			spoofPrompt: undefined,
-			includeProjectTree: isFirstMessage,
-		});
-	}
-	systemTimer.end();
-	debugLog('[system] composed prompt (provider+base+agent):');
-	debugLog(system);
-	const toolsTimer = time('runner:discoverTools');
-	const allTools = await discoverProjectTools(cfg.projectRoot);
-	toolsTimer.end({ count: allTools.length });
-	const allowedNames = new Set([
-		...(agentCfg.tools || []),
-		'finish',
-		'progress_update',
-	]);
-	const gated = allTools.filter((t) => allowedNames.has(t.name));
-	const messagesWithSystemInstructions = [
-		...(isFirstMessage ? additionalSystemMessages : []),
-		...history,
-	];
-	const { sharedCtx, firstToolTimer, firstToolSeen } = await setupToolContext(
-		opts,
-		db,
-	);
-	const toolset = adaptTools(gated, sharedCtx);
-	const modelTimer = time('runner:resolveModel');
-	const model = await resolveModel(opts.provider, opts.model, cfg);
-	modelTimer.end();
-	const maxOutputTokens = getMaxOutputTokens(opts.provider, opts.model);
-	let currentPartId = opts.assistantPartId;
+export async function runAssistant(opts: RunOpts) {
+	const db = await getDb();
+	const config = await loadConfig();
+	const [provider, modelName] = opts.model.split('/', 2);
+	const model = resolveModel(provider, modelName);
+	// Build agent + system prompt
+	const agentConfig = resolveAgentConfig(opts.agent);
+	const availableTools = await discoverProjectTools(config.project.root);
+	const system = composeSystemPrompt(agentConfig, availableTools);
+	// Build message history
+	const history = await buildHistoryMessages(opts, db);
+	// Setup tool context
+	const toolContext = await setupToolContext(opts, db);
+	const { tools, sharedCtx } = toolContext;
+	// State
+	let currentPartId = sharedCtx.assistantPartId;
+	let stepIndex = sharedCtx.stepIndex;
 	let accumulated = '';
-	let stepIndex = 0;
+	const abortController = new AbortController();
-	let finishObserved = false;
-	const unsubscribeFinish = subscribe(opts.sessionId, (evt) => {
-		if (evt.type !== 'tool.result') return;
-		try {
-			const name = (evt.payload as { name?: string } | undefined)?.name;
-			if (name === 'finish') finishObserved = true;
-		} catch {}
-	});
-	const streamStartTimer = time('runner:first-delta');
-	let firstDeltaSeen = false;
-	debugLog(`[streamText] Calling with maxOutputTokens: ${maxOutputTokens}`);
-	// State management helpers
+	// State getters/setters
 	const getCurrentPartId = () => currentPartId;
 	const getStepIndex = () => stepIndex;
 	const updateCurrentPartId = (id: string) => {
@@ -214,12 +71,10 @@ async function runAssistant(opts: RunOpts) {
 	const updateAccumulated = (text: string) => {
 		accumulated = text;
 	};
-	const incrementStepIndex = () => {
-		stepIndex += 1;
-		return stepIndex;
-	};
+	const getAccumulated = () => accumulated;
+	const incrementStepIndex = () => ++stepIndex;
-	// Create stream handlers
+	// Handlers
 	const onStepFinish = createStepFinishHandler(
 		opts,
 		db,
@@ -229,85 +84,106 @@ async function runAssistant(opts: RunOpts) {
 		updateCurrentPartId,
 		updateAccumulated,
 		incrementStepIndex,
+		updateSessionTokensIncremental,
+		updateMessageTokensIncremental,
 	);
-	const onError = createErrorHandler(opts, db, getStepIndex, sharedCtx);
-	const onAbort = createAbortHandler(opts, db, getStepIndex, sharedCtx);
 	const onFinish = createFinishHandler(
 		opts,
 		db,
-		() => ensureFinishToolCalled(finishObserved, toolset, sharedCtx, stepIndex),
-		updateSessionTokens,
 		completeAssistantMessage,
+		getAccumulated,
+		abortController,
+	);
+	const _onAbort = createAbortHandler(opts, db, abortController);
+	const onError = createErrorHandler(opts, db);
+	// Context optimization
+	const contextOptimized = optimizeContext(history, {
+		deduplicateFiles: true,
+		maxToolResults: 30,
+	});
+	// Truncate history
+	const truncatedMessages = truncateHistory(contextOptimized, 20);
+	// Add cache control
+	const { system: cachedSystem, messages: optimizedMessages } = addCacheControl(
+		opts.provider,
+		system,
+		truncatedMessages,
 	);
 	try {
-		const result = streamText({
+		const maxTokens = getMaxOutputTokens(provider, modelName);
+		const result = await streamText({
 			model,
-			tools: toolset,
-			...(String(system || '').trim() ? { system } : {}),
-			messages: messagesWithSystemInstructions,
-			...(maxOutputTokens ? { maxOutputTokens } : {}),
-			abortSignal: opts.abortSignal,
-			stopWhen: hasToolCall('finish'),
+			system: cachedSystem,
+			messages: optimizedMessages,
+			tools,
+			maxSteps: 50,
+			maxTokens,
+			temperature: agentConfig.temperature ?? 0.7,
+			abortSignal: abortController.signal,
 			onStepFinish,
-			onError,
-			onAbort,
 			onFinish,
+			experimental_continueSteps: true,
 		});
+		// Process the stream
 		for await (const delta of result.textStream) {
-			if (!delta) continue;
-			if (!firstDeltaSeen) {
-				firstDeltaSeen = true;
-				streamStartTimer.end();
-			}
+			if (abortController.signal.aborted) break;
 			accumulated += delta;
-			publish({
-				type: 'message.part.delta',
+			if (currentPartId) {
+				await db
+					.update(messageParts)
+					.set({ content: accumulated })
+					.where(eq(messageParts.id, currentPartId));
+			}
+			publish('stream:text-delta', {
 				sessionId: opts.sessionId,
-				payload: {
-					messageId: opts.assistantMessageId,
-					partId: currentPartId,
-					stepIndex,
-					delta,
-				},
+				messageId: opts.assistantMessageId,
+				assistantMessageId: opts.assistantMessageId,
+				stepIndex,
+				textDelta: delta,
+				fullText: accumulated,
 			});
-			await db
-				.update(messageParts)
-				.set({ content: JSON.stringify({ text: accumulated }) })
-				.where(eq(messageParts.id, currentPartId));
 		}
-	} catch (error) {
-		const errorPayload = toErrorPayload(error);
-		await db
-			.update(messageParts)
-			.set({
-				content: JSON.stringify({
-					text: accumulated,
-					error: errorPayload.message,
-				}),
-			})
-			.where(eq(messageParts.messageId, opts.assistantMessageId));
-		publish({
-			type: 'error',
-			sessionId: opts.sessionId,
-			payload: {
-				messageId: opts.assistantMessageId,
-				error: errorPayload.message,
-				details: errorPayload.details,
-			},
-		});
-		throw error;
+	} catch (err) {
+		await onError(err);
 	} finally {
-		if (!firstToolSeen()) firstToolTimer.end({ skipped: true });
-		try {
-			unsubscribeFinish();
-		} catch {}
-		try {
-			await cleanupEmptyTextParts(opts, db);
-		} catch {}
+		setRunning(opts.sessionId, false);
+		dequeueJob(opts.sessionId);
 	}
 }
+/**
+ * Enqueues an assistant run
+ */
+export async function enqueueAssistantRun(opts: RunOpts) {
+	return enqueueRun(opts);
+}
+/**
+ * Aborts a running session
+ */
+export async function abortSession(sessionId: number) {
+	return abortSessionQueue(sessionId);
+}
+/**
+ * Gets the current runner state for a session
+ */
+export function getSessionState(sessionId: number) {
+	return getRunnerState(sessionId);
+}
+/**
+ * Cleanup session resources
+ */
+export function cleanupSessionResources(sessionId: number) {
+	return cleanupSession(sessionId);
+}

package/src/runtime/session-manager.ts CHANGED

@@ -50,6 +50,8 @@ export async function createSession({
 		lastActiveAt: null,
 		totalInputTokens: null,
 		totalOutputTokens: null,
+		totalCachedTokens: null,
+		totalReasoningTokens: null,
 		totalToolTimeMs: null,
 		toolCountsJson: null,
 	};