npm - omnikey-cli - Versions diffs - 1.0.23 → 1.0.25 - Mend

omnikey-cli 1.0.23 → 1.0.25

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (17) hide show

package/backend-dist/agent/agentAuth.js +134 -0
package/backend-dist/agent/agentServer.js +21 -143
package/backend-dist/agent/types.js +2 -0
package/backend-dist/agent/utils.js +104 -0
package/backend-dist/ai-client.js +40 -0
package/backend-dist/config.js +1 -1
package/backend-dist/index.js +25 -3
package/backend-dist/models/appDownload.js +34 -0
package/backend-dist/web-search/browser-playwright.js +613 -0
package/backend-dist/web-search/index.js +17 -0
package/backend-dist/web-search/llm-auth-check.js +127 -0
package/backend-dist/{web-search-provider.js → web-search/web-search-provider.js} +106 -18
package/dist/daemon.js +22 -7
package/dist/removeConfig.js +12 -4
package/package.json +3 -2
package/src/daemon.ts +29 -8
package/src/removeConfig.ts +18 -4

package/backend-dist/agent/agentAuth.js ADDED Viewed

@@ -0,0 +1,134 @@
+"use strict";
+var __importDefault = (this && this.__importDefault) || function (mod) {
+    return (mod && mod.__esModule) ? mod : { "default": mod };
+};
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.authenticateFromAuthHeader = authenticateFromAuthHeader;
+exports.createLazyAuthContext = createLazyAuthContext;
+const jsonwebtoken_1 = __importDefault(require("jsonwebtoken"));
+const config_1 = require("../config");
+const subscription_1 = require("../models/subscription");
+const authMiddleware_1 = require("../authMiddleware");
+/**
+ * Authenticates an agent WebSocket connection from a Bearer token in the Authorization header.
+ *
+ * In self-hosted mode `authHeader` is ignored: JWT verification is skipped and the self-hosted subscription is returned directly.
+ * Otherwise, requires `config.jwtSecret`, verifies the JWT, and looks up the subscription by primary key using the token's `sid` claim.
+ * A subscription already in status `'expired'` is rejected; one whose `licenseKeyExpiresAt` is at or before now is marked `'expired'`, saved, and rejected.
+ *
+ * @param authHeader - The raw `Authorization` header value (e.g. `"Bearer <token>"`); a missing or malformed value yields `null`.
+ * @param log - Logger instance scoped to the current connection.
+ * @returns The authenticated `Subscription`, or `null` on any failure; errors from the self-hosted lookup, JWT verification, database lookup and save are caught and logged, not rethrown.
+ */
+async function authenticateFromAuthHeader(authHeader, log) {
+    if (config_1.config.isSelfHosted) {
+        log.info('Self-hosted mode: skipping JWT authentication for agent WebSocket connection.');
+        try {
+            const subscription = await (0, authMiddleware_1.selfHostedSubscription)();
+            log.info('Retrieved self-hosted subscription for agent WebSocket connection', {
+                subscriptionId: subscription.id,
+            });
+            return subscription;
+        }
+        catch (err) {
+            log.error('Failed to retrieve self-hosted subscription for agent WebSocket connection', {
+                error: err,
+            });
+            return null;
+        }
+    }
+    if (!config_1.config.jwtSecret) {
+        log.error('JWT secret is not configured. Cannot authenticate subscription from auth header.');
+        return null;
+    }
+    if (!authHeader) {
+        log.warn('Agent WebSocket connection missing authorization header');
+        return null;
+    }
+    const [scheme, token] = authHeader.split(' ');
+    if (scheme !== 'Bearer' || !token) {
+        log.warn('Agent WebSocket connection has malformed authorization header');
+        return null;
+    }
+    try {
+        const decoded = jsonwebtoken_1.default.verify(token, config_1.config.jwtSecret);
+        const subscription = await subscription_1.Subscription.findByPk(decoded.sid);
+        if (!subscription) {
+            log.warn('Agent WebSocket auth failed: subscription not found', {
+                sid: decoded.sid,
+            });
+            return null;
+        }
+        if (subscription.subscriptionStatus === 'expired') {
+            log.warn('Agent WebSocket auth failed: subscription expired', {
+                sid: decoded.sid,
+            });
+            return null;
+        }
+        const now = new Date();
+        if (subscription.licenseKeyExpiresAt && subscription.licenseKeyExpiresAt <= now) {
+            subscription.subscriptionStatus = 'expired';
+            await subscription.save();
+            log.info('Agent WebSocket auth: subscription key expired during connection', {
+                subscriptionId: subscription.id,
+            });
+            return null;
+        }
+        log.debug('Agent WebSocket auth succeeded', {
+            subscriptionId: subscription.id,
+            status: subscription.subscriptionStatus,
+        });
+        return subscription;
+    }
+    catch (err) {
+        log.warn('Agent WebSocket auth failed: invalid or expired JWT', { error: err });
+        return null;
+    }
+}
+/**
+ * Creates a lazy authentication context for a WebSocket connection.
+ *
+ * Authentication is deferred until the first call to `ensureAuthenticated`; the outcome (success or failure)
+ * is cached, so later calls never re-run `authenticateFromAuthHeader` and a failed attempt is not retried.
+ * Concurrent calls during the first authentication are coalesced into a single in-flight promise.
+ *
+ * @param authHeader - The raw `Authorization` header value forwarded from the upgrade request.
+ * @param log - Logger instance scoped to the current connection.
+ * @returns An `AuthContext`: `ensureAuthenticated()` resolves to `true` only once a subscription has been cached; `getSubscription()` returns that subscription, or `null` until then.
+ */
+function createLazyAuthContext(authHeader, log) {
+    let authenticatedSubscription = null;
+    let authFailed = false;
+    let authPromise = null;
+    const ensureAuthenticated = async () => {
+        if (authenticatedSubscription) {
+            return true;
+        }
+        if (authFailed) {
+            return false;
+        }
+        if (!authPromise) {
+            authPromise = (async () => {
+                try {
+                    const sub = await authenticateFromAuthHeader(authHeader, log);
+                    if (!sub) {
+                        authFailed = true;
+                        return;
+                    }
+                    authenticatedSubscription = sub;
+                    log.info('Agent WebSocket authenticated', {
+                        subscriptionId: authenticatedSubscription.id,
+                    });
+                }
+                catch (err) {
+                    authFailed = true;
+                    log.error('Unexpected error during agent WebSocket auth', { error: err });
+                }
+            })();
+        }
+        await authPromise;
+        return Boolean(authenticatedSubscription);
+    };
+    const getSubscription = () => authenticatedSubscription;
+    return { ensureAuthenticated, getSubscription };
+}

package/backend-dist/agent/agentServer.js CHANGED Viewed

@@ -38,7 +38,6 @@ var __importDefault = (this && this.__importDefault) || function (mod) {
 Object.defineProperty(exports, "__esModule", { value: true });
 exports.attachAgentWebSocketServer = attachAgentWebSocketServer;
 const ws_1 = __importStar(require("ws"));
-const jsonwebtoken_1 = __importDefault(require("jsonwebtoken"));
 const cuid_1 = __importDefault(require("cuid"));
 const config_1 = require("../config");
 const logger_1 = require("../logger");
@@ -46,8 +45,9 @@ const subscription_1 = require("../models/subscription");
 const subscriptionUsage_1 = require("../models/subscriptionUsage");
 const agentPrompts_1 = require("./agentPrompts");
 const featureRoutes_1 = require("../featureRoutes");
-const authMiddleware_1 = require("../authMiddleware");
-const web_search_provider_1 = require("../web-search-provider");
+const web_search_provider_1 = require("../web-search/web-search-provider");
+const agentAuth_1 = require("./agentAuth");
+const utils_1 = require("./utils");
 const ai_client_1 = require("../ai-client");
 async function runToolLoop(initialResult, session, sessionId, send, log, tools, onUsage) {
     const MAX_TOOL_ITERATIONS = 10;
@@ -61,7 +61,7 @@ async function runToolLoop(initialResult, session, sessionId, send, log, tools,
         // would leave the history ending with an assistant turn, causing a 400.
         if (!toolCalls.length)
             break;
-        session.history.push(result.assistantMessage);
+        (0, utils_1.pushToSessionHistory)(logger_1.logger, session, result.assistantMessage);
         log.info('Agent executing tool calls', {
             sessionId,
             turn: session.turns,
@@ -91,7 +91,7 @@ async function runToolLoop(initialResult, session, sessionId, send, log, tools,
             return { id: tc.id, name: tc.name, result: toolResult };
         }));
         for (const { id, name, result: toolResult } of toolResults) {
-            session.history.push({
+            (0, utils_1.pushToSessionHistory)(logger_1.logger, session, {
                 role: 'tool',
                 tool_call_id: id,
                 tool_name: name,
@@ -109,19 +109,19 @@ async function runToolLoop(initialResult, session, sessionId, send, log, tools,
     // force a final text response by calling again without tools.
     if (result.finish_reason === 'tool_calls') {
         log.warn('Tool loop hit MAX_TOOL_ITERATIONS; forcing final conclusion', { sessionId });
-        session.history.push(result.assistantMessage);
+        (0, utils_1.pushToSessionHistory)(logger_1.logger, session, result.assistantMessage);
         // The API requires a tool_result for every tool_use in the preceding
         // assistant message. Add synthetic results for any unexecuted calls so
         // the history remains valid before we send the follow-up user message.
         for (const tc of result.tool_calls ?? []) {
-            session.history.push({
+            (0, utils_1.pushToSessionHistory)(logger_1.logger, session, {
                 role: 'tool',
                 tool_call_id: tc.id,
                 tool_name: tc.name,
                 content: 'Tool call limit reached. Result unavailable.',
             });
         }
-        session.history.push({
+        (0, utils_1.pushToSessionHistory)(logger_1.logger, session, {
             role: 'user',
             content: 'You have reached the maximum number of tool calls. Do NOT make any further tool calls or web searches. You MUST now provide a final answer directly. If you still need to gather information from the system, generate a `<shell_scripts>` block instead of making tool calls.',
         });
@@ -136,10 +136,6 @@ async function runToolLoop(initialResult, session, sessionId, send, log, tools,
     });
     return result;
 }
-function buildAvailableTools() {
-    // web_search is always available — DuckDuckGo is used as free fallback
-    return [web_search_provider_1.WEB_FETCH_TOOL, web_search_provider_1.WEB_SEARCH_TOOL];
-}
 const aiModel = (0, ai_client_1.getDefaultModel)(config_1.config.aiProvider, 'smart');
 const sessionMessages = new Map();
 const MAX_TURNS = 10;
@@ -199,79 +195,6 @@ ${prompt}
         hasStoredPrompt: !!prompt,
     };
 }
-async function authenticateFromAuthHeader(authHeader, log) {
-    if (config_1.config.isSelfHosted) {
-        log.info('Self-hosted mode: skipping JWT authentication for agent WebSocket connection.');
-        try {
-            const subscription = await (0, authMiddleware_1.selfHostedSubscription)();
-            log.info('Retrieved self-hosted subscription for agent WebSocket connection', {
-                subscriptionId: subscription.id,
-            });
-            return subscription;
-        }
-        catch (err) {
-            log.error('Failed to retrieve self-hosted subscription for agent WebSocket connection', {
-                error: err,
-            });
-            return null;
-        }
-    }
-    if (!config_1.config.jwtSecret) {
-        log.error('JWT secret is not configured. Cannot authenticate subscription from auth header.');
-        return null;
-    }
-    if (!authHeader) {
-        log.warn('Agent WebSocket connection missing authorization header');
-        return null;
-    }
-    const [scheme, token] = authHeader.split(' ');
-    if (scheme !== 'Bearer' || !token) {
-        log.warn('Agent WebSocket connection has malformed authorization header');
-        return null;
-    }
-    try {
-        const decoded = jsonwebtoken_1.default.verify(token, config_1.config.jwtSecret);
-        const subscription = await subscription_1.Subscription.findByPk(decoded.sid);
-        if (!subscription) {
-            log.warn('Agent WebSocket auth failed: subscription not found', {
-                sid: decoded.sid,
-            });
-            return null;
-        }
-        if (subscription.subscriptionStatus === 'expired') {
-            log.warn('Agent WebSocket auth failed: subscription expired', {
-                sid: decoded.sid,
-            });
-            return null;
-        }
-        const now = new Date();
-        if (subscription.licenseKeyExpiresAt && subscription.licenseKeyExpiresAt <= now) {
-            subscription.subscriptionStatus = 'expired';
-            await subscription.save();
-            log.info('Agent WebSocket auth: subscription key expired during connection', {
-                subscriptionId: subscription.id,
-            });
-            return null;
-        }
-        log.debug('Agent WebSocket auth succeeded', {
-            subscriptionId: subscription.id,
-            status: subscription.subscriptionStatus,
-        });
-        return subscription;
-    }
-    catch (err) {
-        log.warn('Agent WebSocket auth failed: invalid or expired JWT', { error: err });
-        return null;
-    }
-}
-function createUserContent(content, hasStoredPrompt) {
-    return hasStoredPrompt
-        ? content
-            .toLowerCase()
-            .replace(/@omniagent/g, '')
-            .trim()
-        : content;
-}
 async function runAgentTurn(sessionId, subscription, clientMessage, send, log) {
     const { sessionState: session, hasStoredPrompt } = await getOrCreateSession(sessionId, subscription, clientMessage.platform, log);
     // Count this call as one agent iteration.
@@ -284,7 +207,7 @@ async function runAgentTurn(sessionId, subscription, clientMessage, send, log) {
     // On the MAX_TURNS iteration, instruct the LLM to provide a final,
     // consolidated answer based on the full conversation context.
     if (session.turns === MAX_TURNS) {
-        session.history.push({
+        (0, utils_1.pushToSessionHistory)(logger_1.logger, session, {
             role: 'system',
             content: 'Provide a single, final, concise answer based on the entire conversation so far. Wrap the answer in a <final_answer>...</final_answer> block and do not ask for further input or mention additional shell scripts to run. Do not include any <shell_script> block in this response.',
         });
@@ -314,17 +237,17 @@ async function runAgentTurn(sessionId, subscription, clientMessage, send, log) {
         // represent environment feedback that the agent must reason about next.
         // Pushing them as 'assistant' would create two consecutive assistant turns
         // which breaks most LLM APIs and prevents the model from processing the output.
-        session.history.push({
+        (0, utils_1.pushToSessionHistory)(logger_1.logger, session, {
             role: 'user',
             content: isAssistance
                 ? userContent
-                : `<user_input>${createUserContent(userContent, hasStoredPrompt)}</user_input>`,
+                : `<user_input>${(0, utils_1.createUserContent)(userContent, hasStoredPrompt)}</user_input>`,
         });
     }
     // On the final turn we omit tools so the model is forced to emit a
     // plain text <final_answer> rather than issuing another tool call.
     const isFinalTurn = session.turns >= MAX_TURNS;
-    const tools = isFinalTurn ? undefined : buildAvailableTools();
+    const tools = isFinalTurn ? undefined : (0, utils_1.buildAvailableTools)();
     const recordUsage = async (result) => {
         const usage = result.usage;
         if (!usage || !subscription.id || config_1.config.isSelfHosted)
@@ -366,7 +289,7 @@ async function runAgentTurn(sessionId, subscription, clientMessage, send, log) {
         if (!content && result.finish_reason !== 'tool_calls') {
             log.warn('Agent LLM returned empty content; sending generic error to client.');
             const errorMessage = 'The agent returned an empty response. Please try again.';
-            sendFinalAnswer(send, sessionId, errorMessage, true);
+            (0, utils_1.sendFinalAnswer)(send, sessionId, errorMessage, true);
             // Clear any cached session state so a subsequent attempt can
             // start fresh without a polluted history.
             sessionMessages.delete(sessionId);
@@ -380,7 +303,7 @@ async function runAgentTurn(sessionId, subscription, clientMessage, send, log) {
                 subscriptionId: subscription.id,
                 turn: session.turns,
             });
-            const toolLoopResult = await runToolLoop(result, session, sessionId, send, log, buildAvailableTools(), recordUsage);
+            const toolLoopResult = await runToolLoop(result, session, sessionId, send, log, (0, utils_1.buildAvailableTools)(), recordUsage);
             const toolLoopContent = toolLoopResult.content.trim();
             const toolLoopHasShell = toolLoopContent.includes('<shell_script>');
             const toolLoopHasFinal = toolLoopContent.includes('<final_answer>');
@@ -402,9 +325,9 @@ async function runAgentTurn(sessionId, subscription, clientMessage, send, log) {
                 // <final_answer>. The directive below tells it to use <shell_script> as
                 // a fallback instead of asking the user to run commands.
                 if (toolLoopResult.assistantMessage) {
-                    session.history.push(toolLoopResult.assistantMessage);
+                    (0, utils_1.pushToSessionHistory)(logger_1.logger, session, toolLoopResult.assistantMessage);
                 }
-                session.history.push({
+                (0, utils_1.pushToSessionHistory)(logger_1.logger, session, {
                     role: 'user',
                     content: webToolFailed
                         ? [
@@ -450,7 +373,7 @@ async function runAgentTurn(sessionId, subscription, clientMessage, send, log) {
                 turn: session.turns,
                 responseLength: result.content.length,
             });
-            session.history.push({
+            (0, utils_1.pushToSessionHistory)(logger_1.logger, session, {
                 role: 'assistant',
                 content,
             });
@@ -487,7 +410,7 @@ async function runAgentTurn(sessionId, subscription, clientMessage, send, log) {
                 subscriptionId: subscription.id,
                 turn: session.turns,
             });
-            session.history.push({ role: 'assistant', content });
+            (0, utils_1.pushToSessionHistory)(log, session, { role: 'assistant', content });
             send({
                 session_id: sessionId,
                 sender: 'agent',
@@ -499,64 +422,19 @@ async function runAgentTurn(sessionId, subscription, clientMessage, send, log) {
             log.warn('Agent returned empty content with no recognized tags; sending error', {
                 sessionId,
             });
-            sendFinalAnswer(send, sessionId, 'The agent returned an empty response. Please try again.', true);
+            (0, utils_1.sendFinalAnswer)(send, sessionId, 'The agent returned an empty response. Please try again.', true);
             sessionMessages.delete(sessionId);
         }
     }
     catch (err) {
         log.error('Agent LLM call failed', { error: err });
         const errorMessage = 'Agent failed to call language model. Please try again later.';
-        sendFinalAnswer(send, sessionId, errorMessage, true);
+        (0, utils_1.sendFinalAnswer)(send, sessionId, errorMessage, true);
         // Clear any cached session state so a subsequent attempt can
         // start fresh without being polluted by a failed turn.
         sessionMessages.delete(sessionId);
     }
 }
-function sendFinalAnswer(send, sessionId, message, isError) {
-    send({
-        session_id: sessionId,
-        sender: 'agent',
-        content: `<final_answer>\n${message}\n</final_answer>`,
-        is_terminal_output: false,
-        is_error: isError,
-    });
-}
-function createLazyAuthContext(authHeader, log) {
-    let authenticatedSubscription = null;
-    let authFailed = false;
-    let authPromise = null;
-    const ensureAuthenticated = async () => {
-        if (authenticatedSubscription) {
-            return true;
-        }
-        if (authFailed) {
-            return false;
-        }
-        if (!authPromise) {
-            authPromise = (async () => {
-                try {
-                    const sub = await authenticateFromAuthHeader(authHeader, log);
-                    if (!sub) {
-                        authFailed = true;
-                        return;
-                    }
-                    authenticatedSubscription = sub;
-                    log.info('Agent WebSocket authenticated', {
-                        subscriptionId: authenticatedSubscription.id,
-                    });
-                }
-                catch (err) {
-                    authFailed = true;
-                    log.error('Unexpected error during agent WebSocket auth', { error: err });
-                }
-            })();
-        }
-        await authPromise;
-        return Boolean(authenticatedSubscription);
-    };
-    const getSubscription = () => authenticatedSubscription;
-    return { ensureAuthenticated, getSubscription };
-}
 function attachAgentWebSocketServer(server) {
     const wss = new ws_1.WebSocketServer({ server, path: '/ws/omni-agent' });
     wss.on('connection', (ws, req) => {
@@ -565,7 +443,7 @@ function attachAgentWebSocketServer(server) {
         log.info('Agent WebSocket connection opened');
         const authHeaderValue = req.headers['authorization'];
         const authHeader = Array.isArray(authHeaderValue) ? authHeaderValue[0] : authHeaderValue;
-        const { ensureAuthenticated, getSubscription } = createLazyAuthContext(authHeader, log);
+        const { ensureAuthenticated, getSubscription } = (0, agentAuth_1.createLazyAuthContext)(authHeader, log);
         const send = (msg) => {
             try {
                 ws.send(JSON.stringify(msg));

package/backend-dist/agent/types.js ADDED Viewed

	@@ -0,0 +1,2 @@
1	+ "use strict";
2	+ Object.defineProperty(exports, "__esModule", { value: true });

package/backend-dist/agent/utils.js ADDED Viewed

@@ -0,0 +1,104 @@
+"use strict";
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.buildAvailableTools = buildAvailableTools;
+exports.createUserContent = createUserContent;
+exports.sendFinalAnswer = sendFinalAnswer;
+exports.pushToSessionHistory = pushToSessionHistory;
+const web_search_provider_1 = require("../web-search/web-search-provider");
+const ai_client_1 = require("../ai-client");
+const config_1 = require("../config");
+/**
+ * Returns the web tools offered to the agent: `WEB_FETCH_TOOL` followed by `WEB_SEARCH_TOOL`.
+ *
+ * `web_search` is always included because DuckDuckGo is used as a free
+ * fallback when no third-party search key is configured.
+ *
+ * @returns A new array on every call holding the two `AITool` definitions imported from `web-search-provider`, ready to pass to the AI client.
+ */
+function buildAvailableTools() {
+    return [web_search_provider_1.WEB_FETCH_TOOL, web_search_provider_1.WEB_SEARCH_TOOL];
+}
+/**
+ * Strips `@omniagent` mentions from user-supplied content.
+ *
+ * The desktop client prefixes messages with `@omniAgent` to trigger the agent.
+ * This helper removes every occurrence of the mention (case-insensitive, anywhere in the string,
+ * not only a leading one) so the raw directive reaches the model without the routing annotation.
+ *
+ * @param content - Raw content string from the client message.
+ * @param hasStoredPrompt - only remove the mention if the command has a stored prompt, otherwise it may be part of the user input and `content` is returned untouched
+ * @returns The content with all mentions removed and surrounding whitespace trimmed, or the original string unchanged when `hasStoredPrompt` is falsy.
+ */
+function createUserContent(content, hasStoredPrompt) {
+    if (hasStoredPrompt) {
+        return content.replace(/@omniagent/gi, '').trim();
+    }
+    return content;
+}
+/**
+ * Sends a `<final_answer>` message to the client through the supplied `send` callback.
+ *
+ * Wraps `message` in `<final_answer>` tags (one newline on each side) so the client knows the
+ * agent has finished reasoning and can display the result. The function only calls `send` once;
+ * it does not close the socket or modify any session state itself.
+ *
+ * @param send - The WebSocket send function scoped to the current connection.
+ * @param sessionId - ID of the session this answer belongs to; sent as `session_id`.
+ * @param message - The final answer text to send to the client.
+ * @param isError - Sent as `is_error`; when `true`, the client renders the message as an error.
+ */
+function sendFinalAnswer(send, sessionId, message, isError) {
+    send({
+        session_id: sessionId,
+        sender: 'agent',
+        content: `<final_answer>\n${message}\n</final_answer>`,
+        is_terminal_output: false,
+        is_error: isError,
+    });
+}
+// Per-message character cap for the configured provider (config.aiProvider), resolved once when this module loads.
+const MAX_MESSAGE_CONTENT = (0, ai_client_1.getMaxMessageContentLength)(config_1.config.aiProvider);
+// Total character budget across all history messages (derived from the
+// provider's context-window size minus headroom for output + system prompt); also resolved once at module load.
+const MAX_HISTORY_TOTAL = (0, ai_client_1.getMaxHistoryLength)(config_1.config.aiProvider);
+const FINAL_ANSWER_REQUEST = {
+    role: 'user',
+    content: 'Content was truncated because a length limit was reached. ' +
+        'You MUST stop making tool calls and provide a final answer immediately using <final_answer>...</final_answer>.',
+};
+/**
+ * Pushes a message onto the session history, enforcing two independent limits on string content:
+ *
+ * 1. **Per-message limit** (`MAX_MESSAGE_CONTENT`) — the provider's hard cap on a single content string
+ *    (e.g. Anthropic: 10 MB, OpenAI/Gemini: context-bound); longer content is cut to exactly that many characters.
+ * 2. **Total history limit** (`MAX_HISTORY_TOTAL`) — the cumulative character budget derived from each provider's
+ *    context-window size; content over the remaining budget is cut to the remainder minus the notice length (floored at 0, so it can become empty).
+ *
+ * A message whose `content` is not a string is pushed as-is and never truncated, and contributes 0 to the running total. Otherwise a shallow copy is pushed;
+ * when either limit was hit, a warning is logged and the shared `FINAL_ANSWER_REQUEST` `user` message (the same object each time) is appended after it.
+ */
+function pushToSessionHistory(logger, session, message) {
+    if (typeof message.content !== 'string') {
+        session.history.push(message);
+        return;
+    }
+    let content = message.content;
+    let limitHit = false;
+    // 1. Per-message content limit.
+    if (content.length > MAX_MESSAGE_CONTENT) {
+        content = content.slice(0, MAX_MESSAGE_CONTENT);
+        limitHit = true;
+    }
+    // 2. Total history length limit.
+    const currentTotal = session.history.reduce((acc, msg) => acc + (typeof msg.content === 'string' ? msg.content.length : 0), 0);
+    const remaining = MAX_HISTORY_TOTAL - currentTotal;
+    if (content.length > remaining) {
+        content = content.slice(0, Math.max(0, remaining - FINAL_ANSWER_REQUEST.content.length));
+        limitHit = true;
+    }
+    session.history.push({ ...message, content });
+    if (limitHit) {
+        logger.warn(`History limits exceeded. Message truncated to ${content.length} chars, total history is now ${currentTotal + content.length} chars.`);
+        session.history.push(FINAL_ANSWER_REQUEST);
+    }
+}

package/backend-dist/ai-client.js CHANGED Viewed

@@ -5,6 +5,8 @@ var __importDefault = (this && this.__importDefault) || function (mod) {
 Object.defineProperty(exports, "__esModule", { value: true });
 exports.aiClient = exports.AIClient = void 0;
 exports.getDefaultModel = getDefaultModel;
+exports.getMaxMessageContentLength = getMaxMessageContentLength;
+exports.getMaxHistoryLength = getMaxHistoryLength;
 const openai_1 = __importDefault(require("openai"));
 const sdk_1 = __importDefault(require("@anthropic-ai/sdk"));
 const genai_1 = require("@google/genai");
@@ -21,6 +23,44 @@ const DEFAULT_MODELS = {
 function getDefaultModel(provider, tier) {
     return DEFAULT_MODELS[provider][tier];
 }
+/**
+ * Maximum character length for a single message content string, keyed by provider name.
+ * Exposed through `getMaxMessageContentLength(provider)`, which yields `undefined` for a provider not listed here.
+ *
+ * - anthropic: hard API-enforced string limit of 10,485,760 chars; we stay
+ *              just below it (10,000,000) as a safety buffer.
+ * - openai:    no documented per-string limit; bounded by the context window
+ *              (~272K tokens for GPT-5.1 ≈ ~1M chars). Uses the same value as the history cap (800,000).
+ * - gemini:    no documented per-string limit; bounded by the 1M-token context window (~4M chars). Uses the same value as the history cap (3,500,000).
+ */
+const MAX_MESSAGE_CONTENT_LENGTH_BY_PROVIDER = {
+    anthropic: 10000000,
+    openai: 800000,
+    gemini: 3500000,
+};
+/**
+ * Maximum total character length across all messages in the conversation
+ * history, derived from each provider's context-window size minus headroom
+ * for the system prompt and max output tokens. The configured values are set below the estimates listed here.
+ * Exposed through `getMaxHistoryLength(provider)`, which yields `undefined` for a provider not listed here.
+ * - anthropic: Claude Sonnet 4.6 — 1M token ctx, 64K max output
+ *              ≈ (1,000,000 - 64,000 - 10,000) tokens × 4 chars ≈ 3.7M chars
+ * - openai:    GPT-5.1 — ~272K token ctx, ~32K max output
+ *              ≈ (272,000 - 32,000 - 5,000) tokens × 4 chars ≈ 940K chars
+ * - gemini:    Gemini 2.5 Pro — 1M token ctx, ~32K max output
+ *              ≈ (1,000,000 - 32,000 - 10,000) tokens × 4 chars ≈ 3.8M chars
+ */
+const MAX_HISTORY_LENGTH_BY_PROVIDER = {
+    anthropic: 3500000,
+    openai: 800000,
+    gemini: 3500000,
+};
+function getMaxMessageContentLength(provider) {
+    return MAX_MESSAGE_CONTENT_LENGTH_BY_PROVIDER[provider];
+}
+function getMaxHistoryLength(provider) {
+    return MAX_HISTORY_LENGTH_BY_PROVIDER[provider];
+}
 // ---------------------------------------------------------------------------
 // OpenAI adapter
 // ---------------------------------------------------------------------------

package/backend-dist/config.js CHANGED Viewed

@@ -91,5 +91,5 @@ exports.config = {
     braveSearchApiKey: getEnv('BRAVE_SEARCH_API_KEY', false),
     tavilyApiKey: getEnv('TAVILY_API_KEY', false),
     searxngUrl: getEnv('SEARXNG_URL', false),
-    terminalPlatform: getEnv('TERMINAL_PLATFORM', false)
+    terminalPlatform: getEnv('TERMINAL_PLATFORM', false),
 };