@xalia/agent 0.6.9 → 0.6.11

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (199)
  1. package/README.md +11 -0
  2. package/dist/agent/src/agent/agent.js +77 -18
  3. package/dist/agent/src/agent/agentUtils.js +3 -2
  4. package/dist/agent/src/agent/documentSummarizer.js +126 -0
  5. package/dist/agent/src/agent/dummyLLM.js +25 -22
  6. package/dist/agent/src/agent/imageGenLLM.js +22 -19
  7. package/dist/agent/src/agent/llm.js +1 -1
  8. package/dist/agent/src/agent/openAILLM.js +15 -12
  9. package/dist/agent/src/agent/openAILLMStreaming.js +68 -37
  10. package/dist/agent/src/agent/repeatLLM.js +16 -7
  11. package/dist/agent/src/agent/tokenCounter.js +390 -0
  12. package/dist/agent/src/agent/tokenCounter.test.js +206 -0
  13. package/dist/agent/src/agent/toolSettings.js +17 -0
  14. package/dist/agent/src/agent/tools/calculatorTool.js +45 -0
  15. package/dist/agent/src/agent/tools/contentExtractors/pdfToText.js +55 -0
  16. package/dist/agent/src/agent/tools/datetimeTool.js +38 -0
  17. package/dist/agent/src/agent/tools/fileManager/fileManagerTool.js +156 -0
  18. package/dist/agent/src/agent/tools/fileManager/index.js +31 -0
  19. package/dist/agent/src/agent/tools/fileManager/memoryFileManager.js +102 -0
  20. package/dist/agent/src/{chat/data → agent/tools/fileManager}/mimeTypes.js +3 -1
  21. package/dist/agent/src/agent/tools/fileManager/prompt.js +33 -0
  22. package/dist/agent/src/{chat/data/dbSessionFileModels.js → agent/tools/fileManager/types.js} +7 -0
  23. package/dist/agent/src/agent/tools/index.js +64 -0
  24. package/dist/agent/src/agent/tools/openUrlTool.js +57 -0
  25. package/dist/agent/src/agent/tools/renderTool.js +89 -0
  26. package/dist/agent/src/agent/tools/utils.js +61 -0
  27. package/dist/agent/src/{chat/utils/search.js → agent/tools/webSearch.js} +1 -2
  28. package/dist/agent/src/agent/tools/webSearchTool.js +40 -0
  29. package/dist/agent/src/chat/client/chatClient.js +28 -0
  30. package/dist/agent/src/chat/client/index.js +4 -1
  31. package/dist/agent/src/chat/client/sessionClient.js +28 -2
  32. package/dist/agent/src/chat/constants.js +8 -0
  33. package/dist/agent/src/chat/data/dbSessionFiles.js +11 -6
  34. package/dist/agent/src/chat/protocol/messages.js +5 -0
  35. package/dist/agent/src/chat/server/chatContextManager.js +45 -25
  36. package/dist/agent/src/chat/server/conversation.js +3 -0
  37. package/dist/agent/src/chat/server/imageGeneratorTools.js +20 -8
  38. package/dist/agent/src/chat/server/openAIRouterLLM.js +0 -3
  39. package/dist/agent/src/chat/server/openSession.js +218 -55
  40. package/dist/agent/src/chat/server/promptRefiner.js +86 -0
  41. package/dist/agent/src/chat/server/server.js +5 -1
  42. package/dist/agent/src/chat/server/sessionFileManager.js +22 -221
  43. package/dist/agent/src/chat/server/sessionRegistry.js +87 -0
  44. package/dist/agent/src/chat/server/titleGenerator.js +112 -0
  45. package/dist/agent/src/chat/server/titleGenerator.test.js +113 -0
  46. package/dist/agent/src/chat/server/tools.js +63 -287
  47. package/dist/agent/src/chat/utils/approvalManager.js +6 -3
  48. package/dist/agent/src/chat/utils/multiAsyncQueue.js +3 -0
  49. package/dist/agent/src/test/agent.test.js +16 -17
  50. package/dist/agent/src/test/chatContextManager.test.js +15 -3
  51. package/dist/agent/src/test/dbMcpServerConfigs.test.js +4 -4
  52. package/dist/agent/src/test/dbSessionFiles.test.js +17 -17
  53. package/dist/agent/src/test/testTools.js +6 -1
  54. package/dist/agent/src/test/tools.test.js +27 -9
  55. package/dist/agent/src/tool/agentChat.js +5 -2
  56. package/dist/agent/src/tool/chatMain.js +34 -7
  57. package/dist/agent/src/tool/commandPrompt.js +2 -2
  58. package/dist/agent/src/tool/files.js +7 -8
  59. package/package.json +8 -2
  60. package/.env.development +0 -1
  61. package/.prettierrc.json +0 -11
  62. package/dist/agent/src/agent/tools.js +0 -44
  63. package/eslint.config.mjs +0 -38
  64. package/scripts/chat_server +0 -8
  65. package/scripts/git_message +0 -31
  66. package/scripts/git_wip +0 -21
  67. package/scripts/pr_message +0 -18
  68. package/scripts/pr_review +0 -16
  69. package/scripts/setup_chat +0 -90
  70. package/scripts/shutdown_chat_server +0 -42
  71. package/scripts/start_chat_server +0 -24
  72. package/scripts/sudomcp_import +0 -23
  73. package/scripts/test_chat +0 -308
  74. package/src/agent/agent.ts +0 -624
  75. package/src/agent/agentUtils.ts +0 -285
  76. package/src/agent/compressingContextManager.ts +0 -129
  77. package/src/agent/context.ts +0 -265
  78. package/src/agent/contextWithWorkspace.ts +0 -162
  79. package/src/agent/dummyLLM.ts +0 -126
  80. package/src/agent/iAgentEventHandler.ts +0 -64
  81. package/src/agent/imageGenLLM.ts +0 -97
  82. package/src/agent/imageGenerator.ts +0 -45
  83. package/src/agent/iplatform.ts +0 -18
  84. package/src/agent/llm.ts +0 -74
  85. package/src/agent/mcpServerManager.ts +0 -541
  86. package/src/agent/nullAgentEventHandler.ts +0 -26
  87. package/src/agent/nullPlatform.ts +0 -13
  88. package/src/agent/openAI.ts +0 -123
  89. package/src/agent/openAILLM.ts +0 -95
  90. package/src/agent/openAILLMStreaming.ts +0 -609
  91. package/src/agent/promptProvider.ts +0 -87
  92. package/src/agent/repeatLLM.ts +0 -50
  93. package/src/agent/sudoMcpServerManager.ts +0 -361
  94. package/src/agent/tokenAuth.ts +0 -50
  95. package/src/agent/tools.ts +0 -57
  96. package/src/chat/client/chatClient.ts +0 -922
  97. package/src/chat/client/connection.test.ts +0 -241
  98. package/src/chat/client/connection.ts +0 -286
  99. package/src/chat/client/constants.ts +0 -1
  100. package/src/chat/client/index.ts +0 -18
  101. package/src/chat/client/interfaces.ts +0 -34
  102. package/src/chat/client/sessionClient.ts +0 -537
  103. package/src/chat/client/sessionFiles.ts +0 -142
  104. package/src/chat/client/teamManager.ts +0 -29
  105. package/src/chat/data/apiKeyManager.ts +0 -76
  106. package/src/chat/data/dataModels.ts +0 -101
  107. package/src/chat/data/database.ts +0 -997
  108. package/src/chat/data/dbMcpServerConfigs.ts +0 -59
  109. package/src/chat/data/dbSessionFileModels.ts +0 -113
  110. package/src/chat/data/dbSessionFiles.ts +0 -99
  111. package/src/chat/data/dbSessionMessages.ts +0 -102
  112. package/src/chat/data/mimeTypes.ts +0 -58
  113. package/src/chat/protocol/connectionMessages.ts +0 -49
  114. package/src/chat/protocol/constants.ts +0 -55
  115. package/src/chat/protocol/errors.ts +0 -16
  116. package/src/chat/protocol/messages.ts +0 -846
  117. package/src/chat/server/README.md +0 -127
  118. package/src/chat/server/chatContextManager.ts +0 -639
  119. package/src/chat/server/connectionManager.test.ts +0 -246
  120. package/src/chat/server/connectionManager.ts +0 -506
  121. package/src/chat/server/conversation.ts +0 -316
  122. package/src/chat/server/errorUtils.ts +0 -28
  123. package/src/chat/server/imageGeneratorTools.ts +0 -160
  124. package/src/chat/server/openAIRouterLLM.ts +0 -171
  125. package/src/chat/server/openSession.ts +0 -1689
  126. package/src/chat/server/openSessionMessageSender.ts +0 -4
  127. package/src/chat/server/server.ts +0 -175
  128. package/src/chat/server/sessionFileManager.ts +0 -422
  129. package/src/chat/server/sessionRegistry.test.ts +0 -137
  130. package/src/chat/server/sessionRegistry.ts +0 -1425
  131. package/src/chat/server/test-utils/mockFactories.ts +0 -422
  132. package/src/chat/server/tools.ts +0 -397
  133. package/src/chat/utils/agentSessionMap.ts +0 -76
  134. package/src/chat/utils/approvalManager.ts +0 -183
  135. package/src/chat/utils/asyncLock.ts +0 -43
  136. package/src/chat/utils/asyncQueue.ts +0 -62
  137. package/src/chat/utils/htmlToText.ts +0 -61
  138. package/src/chat/utils/multiAsyncQueue.ts +0 -62
  139. package/src/chat/utils/responseAwaiter.ts +0 -181
  140. package/src/chat/utils/search.ts +0 -139
  141. package/src/chat/utils/userResolver.ts +0 -48
  142. package/src/chat/utils/websocket.ts +0 -16
  143. package/src/index.ts +0 -0
  144. package/src/test/agent.test.ts +0 -590
  145. package/src/test/approvalManager.test.ts +0 -141
  146. package/src/test/chatContextManager.test.ts +0 -527
  147. package/src/test/clientServerConnection.test.ts +0 -205
  148. package/src/test/compressingContextManager.test.ts +0 -77
  149. package/src/test/context.test.ts +0 -150
  150. package/src/test/contextTestTools.ts +0 -95
  151. package/src/test/conversation.test.ts +0 -109
  152. package/src/test/db.test.ts +0 -363
  153. package/src/test/dbMcpServerConfigs.test.ts +0 -112
  154. package/src/test/dbSessionFiles.test.ts +0 -258
  155. package/src/test/dbSessionMessages.test.ts +0 -85
  156. package/src/test/dbTestTools.ts +0 -157
  157. package/src/test/imageLoad.test.ts +0 -15
  158. package/src/test/mcpServerManager.test.ts +0 -114
  159. package/src/test/multiAsyncQueue.test.ts +0 -183
  160. package/src/test/openaiStreaming.test.ts +0 -177
  161. package/src/test/prompt.test.ts +0 -27
  162. package/src/test/promptProvider.test.ts +0 -33
  163. package/src/test/responseAwaiter.test.ts +0 -103
  164. package/src/test/sudoMcpServerManager.test.ts +0 -63
  165. package/src/test/testTools.ts +0 -171
  166. package/src/test/tools.test.ts +0 -39
  167. package/src/tool/agentChat.ts +0 -194
  168. package/src/tool/agentMain.ts +0 -180
  169. package/src/tool/chatMain.ts +0 -594
  170. package/src/tool/commandPrompt.ts +0 -264
  171. package/src/tool/files.ts +0 -84
  172. package/src/tool/main.ts +0 -25
  173. package/src/tool/nodePlatform.ts +0 -73
  174. package/src/tool/options.ts +0 -144
  175. package/src/tool/prompt.ts +0 -101
  176. package/test_data/background_test_profile.json +0 -6
  177. package/test_data/background_test_script.json +0 -11
  178. package/test_data/dummyllm_script_crash.json +0 -32
  179. package/test_data/dummyllm_script_image_gen.json +0 -19
  180. package/test_data/dummyllm_script_image_gen_fe.json +0 -29
  181. package/test_data/dummyllm_script_invoke_image_gen_tool.json +0 -37
  182. package/test_data/dummyllm_script_render_tool.json +0 -29
  183. package/test_data/dummyllm_script_simplecalc.json +0 -28
  184. package/test_data/dummyllm_script_test_auto_approve.json +0 -81
  185. package/test_data/dummyllm_script_test_simplecalc_addition.json +0 -29
  186. package/test_data/frog.png +0 -0
  187. package/test_data/frog.png.b64 +0 -1
  188. package/test_data/git_message_profile.json +0 -4
  189. package/test_data/git_wip_system.txt +0 -5
  190. package/test_data/image_gen_test_profile.json +0 -5
  191. package/test_data/pr_message_profile.json +0 -4
  192. package/test_data/pr_review_profile.json +0 -4
  193. package/test_data/prompt_simplecalc.txt +0 -1
  194. package/test_data/simplecalc_profile.json +0 -4
  195. package/test_data/sudomcp_import_profile.json +0 -4
  196. package/test_data/test_script_profile.json +0 -8
  197. package/tsconfig.json +0 -13
  198. package/vitest.config.ts +0 -39
  199. package/dist/agent/src/{chat/utils → agent/tools/contentExtractors}/htmlToText.js +0 -0
package/README.md CHANGED
@@ -25,6 +25,17 @@ Example of running agent can be found in [test script](../mcppro/scripts/test_sc
 
 ## Architecture
 
+For a detailed explanation of the context system architecture, including how context is formed, compressed, and managed during agent execution, see:
+
+**📚 [Context System Architecture Documentation](../context_system.md)**
+
+This document covers:
+- Context window structure and composition
+- System prompt fragment injection
+- Automatic context compression
+- Session file handling
+- Transaction-based message flow
+
 ### Core Components
 
 #### Agent (`src/agent/`)
package/dist/agent/src/agent/agent.js CHANGED
@@ -1,6 +1,6 @@
 "use strict";
 Object.defineProperty(exports, "__esModule", { value: true });
-exports.Agent = exports.AgentEx = exports.DEFAULT_LLM_URL = exports.AgentProfile = void 0;
+exports.Agent = exports.AgentEx = exports.USER_STOP_MESSAGE = exports.DEFAULT_LLM_URL = exports.AgentProfile = void 0;
 exports.createUserMessage = createUserMessage;
 exports.createUserMessageEnsure = createUserMessageEnsure;
 exports.completionToAssistantMessageParam = completionToAssistantMessageParam;
@@ -9,9 +9,20 @@ var sdk_1 = require("@xalia/xmcp/sdk");
 Object.defineProperty(exports, "AgentProfile", { enumerable: true, get: function () { return sdk_1.AgentProfile; } });
 const sdk_2 = require("@xalia/xmcp/sdk");
 const mcpServerManager_1 = require("./mcpServerManager");
+const toolSettings_1 = require("./toolSettings");
 exports.DEFAULT_LLM_URL = "http://localhost:5001/v1";
-const MAX_TOOL_CALL_RESPONSE_LENGTH = 4000;
+/**
+ * The message to append to the agent output if the agent is interrupted by a
+ * signal from the user.
+ */
+exports.USER_STOP_MESSAGE = " AGENT INTERRUPTED";
 const logger = (0, sdk_2.getLogger)();
+/**
+ * An agent attached to an ILLM which updates a context via an
+ * IContextTransaction interface (where IContextTransaction is like a DB tx or
+ * DB writer, for staging changes and reading back state as-if those changes
+ * were applied).
+ */
 class AgentEx {
     constructor(mcpServerManager, llm) {
         /// The full list of tools, ready to pass to the LLM
@@ -21,15 +32,25 @@ class AgentEx {
         this.agentTools = new Map();
         this.mcpServerManager = mcpServerManager;
         this.llm = llm;
+        this.stopFlag = false;
+        this.stopFn = undefined;
     }
     async shutdown() {
+        this.stop("shutting down");
         return this.mcpServerManager.shutdown();
     }
+    stop(msg) {
+        this.stopFlag = true;
+        if (this.stopFn) {
+            this.stopFn(msg || exports.USER_STOP_MESSAGE);
+        }
+    }
     getMcpServerManager() {
         return this.mcpServerManager;
     }
     // TODO: rename
     async userMessagesRaw(contextTx, eventHandler) {
+        this.stopFlag = false;
         // New user messages have already been added to the `contextTx`.
         // Image and audio handling
         //
@@ -47,6 +68,11 @@
         contextTx.addMessage(message);
         // While there are tool calls to make, invoke them and loop
         while (message.tool_calls && message.tool_calls.length > 0) {
+            // Signal the event handler of the assistant message with tool calls
+            // BEFORE processing tool results. This ensures the order of messages
+            // in pendingMessages matches the order in the LLM context:
+            // [user, assistant(tool_calls), tool_result, assistant(final)]
+            eventHandler.onCompletion(message);
             // TODO: Execute all tool calls in parallel
             // [indexInContext, ToolCallResult][]
             const toolCallResults = [];
@@ -66,6 +92,11 @@
                 };
                 const toolResultHandle = contextTx.addMessage(toolResult);
                 toolCallResults.push([toolResultHandle, result]);
+                // Immediately broadcast the tool result to the frontend for UI
+                // feedback. This ensures the frontend knows the tool executed
+                // successfully without waiting for the next LLM completion to
+                // finish streaming
+                eventHandler.onToolCallResult(toolResult);
                 // If the tool call requested that its args be redacted, this can be
                 // done now - before the next LLM invocation.
                 if (result.overwriteArgs) {
@@ -74,9 +105,6 @@
                     logger.debug(`agent message after update ${JSON.stringify(message)}`);
                 }
             }
-            // Now that any args have been overwritten, signal the event handler of
-            // the prevoius completion.
-            eventHandler.onCompletion(message);
             // Get a new completion using the untouched tool call results. Note
             // that, since we are deferring the `onToolCallResult` calls (so they
             // can be redacted), we must take care that the errors in
@@ -89,17 +117,15 @@
         }
         finally {
             // Now that the tool call results have been passed to the LLM, perform
-            // any updates on them. Pass the (updated) tool-call-result LLM
-            // messages to the event handler - note, we want to do this even if an
-            // error occured, so that the caller has an up-to-date picture of the
-            // context state when the error occured.
+            // any updates on them if overwriteResponse was requested. If so, send
+            // the updated tool result to the frontend to replace the original.
             toolCallResults.forEach(([handle, tcr]) => {
-                const ctxMsg = contextTx.getMessage(handle);
                 if (tcr.overwriteResponse) {
+                    const ctxMsg = contextTx.getMessage(handle);
                     ctxMsg.content = tcr.overwriteResponse;
+                    (0, assert_1.strict)(ctxMsg.role === "tool");
+                    eventHandler.onToolCallResult(ctxMsg);
                 }
-                (0, assert_1.strict)(ctxMsg.role === "tool");
-                eventHandler.onToolCallResult(ctxMsg);
             });
             // Note, if an error DID occur, the ContextManager does not see any of
             // the new context.
@@ -110,6 +136,26 @@
         return { message, images: images.length === 0 ? undefined : images };
     }
     async chatCompletion(context, eventHandler) {
+        if (this.stopFlag) {
+            return {
+                id: "user_stopped",
+                choices: [
+                    {
+                        finish_reason: "stop",
+                        index: 0,
+                        message: {
+                            content: exports.USER_STOP_MESSAGE,
+                            role: "assistant",
+                            refusal: null,
+                        },
+                        logprobs: null,
+                    },
+                ],
+                created: Date.now(),
+                model: this.llm.getModel(),
+                object: "chat.completion",
+            };
+        }
         // Compute the full list of available tools
         let tools;
         const mcpTools = this.mcpServerManager.getOpenAITools();
@@ -119,7 +165,15 @@
             tools = enabledTools;
         }
         logger.debug(`[chatCompletion] tools: ${JSON.stringify(tools)}`);
-        const completion = await this.llm.getConversationResponse(context, tools, eventHandler.onAgentMessage.bind(eventHandler), eventHandler.onReasoning.bind(eventHandler));
+        // Log system prompt length
+        if (context.length > 0 && context[0].role === "system") {
+            const systemPrompt = context[0].content;
+            logger.info(`[chatCompletion] System prompt length: ${String(systemPrompt.length)}`);
+        }
+        const { stop, completion: completionP } = await this.llm.getConversationResponse(context, tools, eventHandler.onAgentMessage.bind(eventHandler), eventHandler.onReasoning.bind(eventHandler));
+        this.stopFn = stop;
+        const completion = await completionP;
+        this.stopFn = undefined;
         logger.debug(`Received chat completion ${JSON.stringify(completion)}`);
         return completion;
     }
@@ -161,6 +215,9 @@
      * ChatCompletionToolMessageParam to be used in the conversation.
      */
     async doToolCall(toolCall, eventHandler) {
+        if (this.stopFlag) {
+            return { response: exports.USER_STOP_MESSAGE };
+        }
         // If the tool is and "agent" (internal) tool, we can just execute it.
         // Otherwise, call the event handler to get permission and invoke the
         // external tool handler.
@@ -210,11 +267,11 @@
             };
         }
         // Final sanity check on the tool call response length.
-        if (result.response.length > MAX_TOOL_CALL_RESPONSE_LENGTH) {
+        if (result.response.length > toolSettings_1.MAX_TOOL_CALL_RESPONSE_LENGTH) {
             logger.warn("[Agent.doToolCall]: truncating tool call result.response for call:\n" +
                 JSON.stringify(toolCall));
             result.response =
-                result.response.slice(0, MAX_TOOL_CALL_RESPONSE_LENGTH) +
+                result.response.slice(0, toolSettings_1.MAX_TOOL_CALL_RESPONSE_LENGTH) +
                 " ..truncated";
         }
         return result;
@@ -233,8 +290,10 @@
 }
 exports.AgentEx = AgentEx;
 /**
- * Higher-level abstraction over AgentEx, which abstracts out the transactions
- * to the context manager.
+ * Higher-level abstraction over AgentEx, which abstracts out the context
+ * transactions. A single agent is associated with an IContextManager and
+ * internally creates and commits transactions during each call to
+ * `userMessage*`.
  */
 class Agent {
     constructor(eventHandler, mcpServerManager, llm, contextManager) {
@@ -346,7 +405,7 @@ function createUserMessage(msg, imageB64, name) {
 }
 function createUserMessageEnsure(msg, imageB64, name) {
     const userMsg = createUserMessage(msg, imageB64, name);
-    (0, assert_1.strict)(userMsg);
+    (0, assert_1.strict)(userMsg, "createUserMessageEnsure");
     return userMsg;
 }
 function completionToAssistantMessageParam(compMessage) {
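The stop mechanism introduced here threads a callback from the LLM back through the agent: `stop()` sets `stopFlag` (so the next completion and any pending tool calls short-circuit with `USER_STOP_MESSAGE`) and invokes `stopFn` if a completion is currently in flight. A minimal caller-side sketch, assuming hypothetical wiring (the interface below is an illustration, not the package's exported API; only `stop()` and the `" AGENT INTERRUPTED"` marker come from the diff above):

```ts
// Sketch only: this interface is an assumption for illustration, not the
// package API. stop() and the interrupt marker come from agent.js above.
interface StoppableAgent {
  userMessagesRaw(
    tx: unknown,
    handler: unknown,
  ): Promise<{ message: { content: string | null } }>;
  stop(msg?: string): void;
}

async function runTurn(agent: StoppableAgent, tx: unknown, handler: unknown) {
  const run = agent.userMessagesRaw(tx, handler);
  // e.g. wired to a UI "stop" button; here a 30 s watchdog for brevity:
  const timer = setTimeout(() => agent.stop(), 30_000);
  // On interrupt the turn resolves (rather than rejecting), with the
  // " AGENT INTERRUPTED" marker appended to the assistant output.
  const { message } = await run;
  clearTimeout(timer);
  return message;
}
```

Note the design choice visible in `chatCompletion`: an interrupted turn still yields a well-formed `chat.completion` object, so the context manager always commits a consistent transcript.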
package/dist/agent/src/agent/agentUtils.js CHANGED
@@ -55,8 +55,9 @@ async function createSpecializedLLM(model, platform) {
     if (model && model.startsWith("dummy:")) {
         llm = await dummyLLM_1.DummyLLM.initFromModelUrl(model, platform);
     }
-    else if (model === "repeat") {
-        llm = new repeatLLM_1.RepeatLLM();
+    else if (model && model.startsWith("repeat")) {
+        const prefix = model.startsWith("repeat:") ? model.slice(7) : "";
+        llm = new repeatLLM_1.RepeatLLM(prefix);
     }
     return llm;
 }
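The widened check means any model string beginning with `repeat` now selects the RepeatLLM, and the optional `repeat:<prefix>` form passes the text after the colon through as a prefix. A restatement of just that dispatch logic (the model strings below are illustrative examples):

```ts
// Illustrative re-statement of the "repeat" dispatch logic in the diff
// above: returns the RepeatLLM prefix, or undefined for other models.
function repeatPrefix(model: string): string | undefined {
  if (!model.startsWith("repeat")) return undefined; // not a RepeatLLM
  return model.startsWith("repeat:") ? model.slice(7) : "";
}

console.log(repeatPrefix("repeat"));        // "" - echo with no prefix
console.log(repeatPrefix("repeat:Echo: ")); // "Echo: " - prefixed echo
console.log(repeatPrefix("gpt-4o"));        // undefined - some other LLM
```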
package/dist/agent/src/agent/documentSummarizer.js ADDED
@@ -0,0 +1,126 @@
+"use strict";
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.LLMDocumentSummarizer = void 0;
+exports.createDocumentSummarizer = createDocumentSummarizer;
+exports.summarizeDocument = summarizeDocument;
+const openAIRouterLLM_1 = require("../chat/server/openAIRouterLLM");
+const sdk_1 = require("@xalia/xmcp/sdk");
+const logger = (0, sdk_1.getLogger)();
+const SUMMARY_MODEL = "google/gemini-2.5-flash";
+const SUMMARY_MAX_TOKENS = 500;
+const SUMMARY_TEMPERATURE = 0.3;
+const SUMMARY_TIMEOUT_MS = 30000;
+const MAX_CONTENT_LENGTH = 100000;
+/**
+ * System prompt for document summarization, optimized for recall.
+ */
+const SUMMARY_SYSTEM_PROMPT = `You are a document summarizer optimizing for RECALL. Create a summary ` +
+    `(3-10 sentences) that captures:
+- Main topic and purpose of the document
+- Key entities (names, organizations, places, dates, numbers)
+- Important concepts, terms, and topics mentioned
+- Any conclusions, results, or key findings
+
+Include specific details that would help locate this document later.
+Use keywords and phrases from the original text.
+Do NOT include meta-commentary about the document format.
+Output ONLY the summary text.`;
+class LLMDocumentSummarizer {
+    constructor(model = SUMMARY_MODEL) {
+        this.model = model;
+    }
+    async summarize(content) {
+        if (!content || content.trim().length === 0) {
+            return "Empty document";
+        }
+        try {
+            const summary = await this.summarizeWithTimeout(content);
+            return this.sanitizeSummary(summary);
+        }
+        catch (error) {
+            const errorMsg = error instanceof Error ? error.message : String(error);
+            logger.warn(`[DocumentSummarizer] LLM summarization failed: ${errorMsg}, ` +
+                `using fallback`);
+            return this.fallbackSummary(content);
+        }
+    }
+    async summarizeWithTimeout(content) {
+        const timeoutPromise = new Promise((_, reject) => {
+            setTimeout(() => {
+                reject(new Error("Summary generation timeout"));
+            }, SUMMARY_TIMEOUT_MS);
+        });
+        const summaryPromise = this.callLLM(content);
+        return Promise.race([summaryPromise, timeoutPromise]);
+    }
+    async callLLM(content) {
+        const client = (0, openAIRouterLLM_1.getOpenAIClient)(this.model);
+        const truncatedContent = content.length > MAX_CONTENT_LENGTH
+            ? content.slice(0, MAX_CONTENT_LENGTH) + "\n\n[Content truncated...]"
+            : content;
+        const response = await client.chat.completions.create({
+            model: this.model,
+            messages: [
+                {
+                    role: "system",
+                    content: SUMMARY_SYSTEM_PROMPT,
+                },
+                {
+                    role: "user",
+                    content: `Please summarize this document:\n\n${truncatedContent}`,
+                },
+            ],
+            max_tokens: SUMMARY_MAX_TOKENS,
+            temperature: SUMMARY_TEMPERATURE,
+        });
+        const summary = response.choices[0]?.message?.content?.trim();
+        if (!summary) {
+            throw new Error("Empty response from LLM");
+        }
+        return summary;
+    }
+    sanitizeSummary(summary) {
+        return summary.replace(/\s+/g, " ").trim();
+    }
+    fallbackSummary(content) {
+        const cleaned = content.trim();
+        if (cleaned.length === 0) {
+            return "Empty document";
+        }
+        const firstParagraph = cleaned.split(/\n\n/)[0];
+        const maxLength = 500;
+        if (firstParagraph.length <= maxLength) {
+            return firstParagraph;
+        }
+        return cleaned.slice(0, maxLength).trim() + "...";
+    }
+}
+exports.LLMDocumentSummarizer = LLMDocumentSummarizer;
+class FallbackDocumentSummarizer {
+    // eslint-disable-next-line @typescript-eslint/require-await
+    async summarize(content) {
+        const cleaned = content.trim();
+        if (cleaned.length === 0) {
+            return "Empty document";
+        }
+        const firstParagraph = cleaned.split(/\n\n/)[0];
+        const maxLength = 500;
+        if (firstParagraph.length <= maxLength) {
+            return firstParagraph;
+        }
+        return cleaned.slice(0, maxLength).trim() + "...";
+    }
+}
+function createDocumentSummarizer(model) {
+    if (process.env.DISABLE_LLM_SUMMARIES === "true") {
+        return new FallbackDocumentSummarizer();
+    }
+    return new LLMDocumentSummarizer(model);
+}
+/**
+ * Convenience function for one-off summarization.
+ */
+async function summarizeDocument(content) {
+    const summarizer = createDocumentSummarizer();
+    return summarizer.summarize(content);
+}
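Taken together, the new module tries an LLM pass (racing a 30 s timeout) and degrades to a first-paragraph excerpt on any failure, or unconditionally when `DISABLE_LLM_SUMMARIES=true`. A hedged usage sketch; the import path is an assumption based on the dist layout, not a documented entry point:

```ts
// Sketch: one-off summarization via the new helper. The deep import path
// is assumed from the dist layout; adjust to however the package exports it.
import { summarizeDocument } from "@xalia/agent/dist/agent/src/agent/documentSummarizer.js";

async function main(): Promise<void> {
  // Force the non-LLM fallback (first paragraph, capped at 500 chars):
  process.env.DISABLE_LLM_SUMMARIES = "true";
  const summary = await summarizeDocument(
    "Quarterly report for ACME Corp.\n\nRevenue grew 12%...",
  );
  console.log(summary); // "Quarterly report for ACME Corp."
}

void main();
```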
package/dist/agent/src/agent/dummyLLM.js CHANGED
@@ -50,31 +50,34 @@ class DummyLLM {
     }
     async getConversationResponse(messages, _tools, onMessage, onReasoning) {
         await new Promise((r) => setTimeout(r, 0));
-        (0, assert_1.strict)(this.idx < this.responses.length);
         this.lastRequest = messages;
-        for (;;) {
-            const response = this.responses[this.idx++];
-            if (response.finish_reason === "error") {
-                throw new Error(response.message);
-            }
-            if (response.finish_reason === "reasoning") {
-                if (onReasoning) {
-                    await onReasoning(response.message);
+        const completion = (async () => {
+            for (;;) {
+                const idx = this.idx++;
+                const response = this.responses[idx % this.responses.length];
+                if (response.finish_reason === "error") {
+                    throw new Error(response.message);
                 }
-                continue;
-            }
-            if (onMessage) {
-                const message = response.message;
-                void onMessage(message.content || "", true);
+                if (response.finish_reason === "reasoning") {
+                    if (onReasoning) {
+                        await onReasoning(response.message);
+                    }
+                    continue;
+                }
+                if (onMessage) {
+                    const message = response.message;
+                    void onMessage(message.content || "", true);
+                }
+                return {
+                    id: String(idx),
+                    choices: [response],
+                    created: Date.now(),
+                    model: "dummyLlmModel",
+                    object: "chat.completion",
+                };
             }
-            return {
-                id: String(this.idx),
-                choices: [response],
-                created: Date.now(),
-                model: "dummyLlmModel",
-                object: "chat.completion",
-            };
-        }
+        })();
+        return { stop: () => { }, completion };
     }
     setModel(_model) {
         (0, assert_1.strict)(false, "unexpected call to setModel");
package/dist/agent/src/agent/imageGenLLM.js CHANGED
@@ -27,7 +27,7 @@ class ImageGenLLM {
     getUrl() {
         return this.openai.baseURL;
     }
-    async getConversationResponse(messages, tools, onMessage) {
+    getConversationResponse(messages, tools, onMessage) {
         (0, assert_1.strict)(!tools || tools.length === 0, "tools not supported in ImageGenLLM");
         // Designed for image generation using openrouter, which tweaks the Create
         const params = {
@@ -37,25 +37,28 @@ class ImageGenLLM {
             modalities: ["image", "text"],
         };
         logger.info(`[ImageGenLLM] params; ${JSON.stringify(params)}`);
-        const completion = (await this.openai.chat.completions.create(params));
-        // logger.debug(
-        //   `[ImageGenLLM.getConversationResponse] completion:
-        //   ${JSON.stringify(completion)}`
-        // );
-        if (onMessage) {
-            const message = completion.choices[0].message;
-            if (message.content) {
-                await onMessage(message.content, true);
+        const completion = (async () => {
+            const completion = (await this.openai.chat.completions.create(params));
+            // logger.debug(
+            //   `[ImageGenLLM.getConversationResponse] completion:
+            //   ${JSON.stringify(completion)}`
+            // );
+            if (onMessage) {
+                const message = completion.choices[0].message;
+                if (message.content) {
+                    await onMessage(message.content, true);
+                }
+                if (message.images) {
+                    message.images.forEach((image, index) => {
+                        const imageUrl = image.image_url.url; // Base64 data URL
+                        const truncated = imageUrl.substring(0, 50);
+                        logger.info(`[ImageGenLLM] ${String(index + 1)}: ${truncated}...`);
+                    });
+                }
             }
-            if (message.images) {
-                message.images.forEach((image, index) => {
-                    const imageUrl = image.image_url.url; // Base64 data URL
-                    const truncated = imageUrl.substring(0, 50);
-                    logger.info(`[ImageGenLLM] ${String(index + 1)}: ${truncated}...`);
-                });
-            }
-        }
-        return completion;
+            return completion;
+        })();
+        return Promise.resolve({ stop: () => { }, completion });
     }
 }
 exports.ImageGenLLM = ImageGenLLM;
package/dist/agent/src/agent/llm.js CHANGED
@@ -2,6 +2,6 @@
 Object.defineProperty(exports, "__esModule", { value: true });
 exports.XALIA_APP_HEADER = void 0;
 exports.XALIA_APP_HEADER = {
-    "HTTP-Referer": "xalia.ai",
+    "HTTP-Referer": "https://xalia.ai",
     "X-Title": "Xalia",
 };
package/dist/agent/src/agent/openAILLM.js CHANGED
@@ -46,19 +46,22 @@ class OpenAILLM {
     getUrl() {
         return this.openai.baseURL;
     }
-    async getConversationResponse(messages, tools, onMessage) {
-        const completion = await this.openai.chat.completions.create({
-            model: this.model,
-            messages,
-            tools,
-        });
-        if (onMessage) {
-            const message = completion.choices[0].message;
-            if (message.content) {
-                await onMessage(message.content, true);
+    getConversationResponse(messages, tools, onMessage) {
+        const completion = (async () => {
+            const completion = await this.openai.chat.completions.create({
+                model: this.model,
+                messages,
+                tools,
+            });
+            if (onMessage) {
+                const message = completion.choices[0].message;
+                if (message.content) {
+                    await onMessage(message.content, true);
+                }
             }
-        }
-        return completionFromOpenAI(completion);
+            return completionFromOpenAI(completion);
+        })();
+        return Promise.resolve({ stop: () => { }, completion });
     }
 }
 exports.OpenAILLM = OpenAILLM;
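The same refactor runs through DummyLLM, ImageGenLLM, OpenAILLM and (below) OpenAILLMStreaming: `getConversationResponse` no longer resolves directly to a completion, but to a handle pairing a `stop` callback with the completion promise; non-streaming implementations return a no-op `stop`. A plausible shape for the shared contract, reconstructed from the call sites in this diff (the real typings lived in the removed `src/agent/llm.ts`, so these names are assumptions):

```ts
// Reconstructed from call sites in this diff; names are assumptions since
// the real ILLM typings were in the now-removed src/agent/llm.ts.
import type OpenAI from "openai";

interface ConversationHandle {
  // Asks an in-flight completion to wind down. Non-streaming LLMs return
  // a no-op, as in "{ stop: () => { }, completion }" above.
  stop: (msg?: string) => void;
  completion: Promise<OpenAI.ChatCompletion>;
}

// The call-site pattern from AgentEx.chatCompletion: register the stop
// hook for the duration of the await, then clear it.
async function awaitWithStopHook(
  handle: ConversationHandle,
  register: (stop?: (msg?: string) => void) => void,
): Promise<OpenAI.ChatCompletion> {
  register(handle.stop); // this.stopFn = stop;
  try {
    return await handle.completion;
  } finally {
    register(undefined); // this.stopFn = undefined;
  }
}
```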
package/dist/agent/src/agent/openAILLMStreaming.js CHANGED
@@ -439,47 +439,78 @@ class OpenAILLMStreaming {
         if (!chunks.iterator) {
             throw new Error("not a stream");
         }
-        let aggregatedMessage;
-        for await (const chunk of chunks) {
-            logger.debug(`[stream] chunk: ${JSON.stringify(chunk)}`);
-            // eslint-disable-next-line @typescript-eslint/no-unnecessary-condition
-            if (chunk.object !== "chat.completion.chunk") {
-                // logger.warn("[stream]: unexpected message");
-                continue;
-            }
-            if (!aggregatedMessage) {
-                logger.debug(`[stream] first}`);
-                const { initMessage } = initializeCompletion(chunk);
-                aggregatedMessage = initMessage;
-            }
-            else {
-                updateCompletion(aggregatedMessage, chunk);
-            }
-            if (onMessage) {
-                // Inform the call of a message fragment if it contains any text.
-                // Note: chunks may have zero choices (e.g., usage-only chunks), so
-                // we safely access the first choice.
-                const delta = chunk.choices[0]?.delta;
+        let stopMsg = undefined;
+        const stop = (msg) => {
+            stopMsg = msg;
+        };
+        const completion = (async () => {
+            // Completion built up over successive calls to processChunk.
+            let aggregatedMessage;
+            const processChunk = async (chunk) => {
                 // eslint-disable-next-line @typescript-eslint/no-unnecessary-condition
-            if (delta?.content) {
-                await onMessage(delta.content, false);
+                if (chunk.object !== "chat.completion.chunk") {
+                    // logger.warn("[stream]: unexpected message");
+                    return;
                 }
-            }
-            if (onReasoning) {
-                const delta = chunk.choices[0]
-                    ?.delta;
-                const reasoning = (0, openAI_1.choiceDeltaExtractReasoning)(delta);
-                if (reasoning) {
-                    await onReasoning(reasoning);
+                if (!aggregatedMessage) {
+                    logger.debug(`[stream] first}`);
+                    const { initMessage } = initializeCompletion(chunk);
+                    aggregatedMessage = initMessage;
+                }
+                else {
+                    updateCompletion(aggregatedMessage, chunk);
                 }
+                if (onMessage) {
+                    // Inform the call of a message fragment if it contains any text.
+                    // Note: chunks may have zero choices (e.g., usage-only chunks), so
+                    // we safely access the first choice.
+                    const delta = chunk.choices[0]?.delta;
+                    // eslint-disable-next-line
+                    if (delta?.content) {
+                        await onMessage(delta.content, false);
+                    }
+                }
+                if (onReasoning) {
+                    const delta = chunk.choices[0]
+                        ?.delta;
+                    const reasoning = (0, openAI_1.choiceDeltaExtractReasoning)(delta);
+                    if (reasoning) {
+                        await onReasoning(reasoning);
+                    }
+                }
+            };
+            // Process each chunk, checking for a stop signal.
+            for await (const chunk of chunks) {
+                logger.debug(`[stream] chunk: ${JSON.stringify(chunk)}`);
+                await processChunk(chunk);
+                /* eslint-disable @typescript-eslint/no-unnecessary-condition */
+                if (stopMsg) {
+                    const choice = {
+                        delta: { content: stopMsg },
+                        finish_reason: aggregatedMessage && aggregatedMessage.choices[0].finish_reason
+                            ? null
+                            : "stop",
+                        index: 0,
+                    };
+                    await processChunk({
+                        id: aggregatedMessage?.id || "user_stop_chunk",
+                        created: aggregatedMessage?.created || Date.now(),
+                        model: aggregatedMessage?.model || model,
+                        object: "chat.completion.chunk",
+                        choices: [choice],
+                    });
+                    break;
+                }
+                /* eslint-enable @typescript-eslint/no-unnecessary-condition */
             }
-        }
-        if (onMessage) {
-            await onMessage("", true);
-        }
-        logger.debug(`[stream] final message: ${JSON.stringify(aggregatedMessage)}`);
-        (0, assert_1.strict)(aggregatedMessage);
-        return aggregatedMessage;
+            if (onMessage) {
+                await onMessage("", true);
+            }
+            logger.debug(`[stream] final message: ${JSON.stringify(aggregatedMessage)}`);
+            (0, assert_1.strict)(aggregatedMessage);
+            return aggregatedMessage;
+        })();
+        return { stop, completion };
     }
 }
 exports.OpenAILLMStreaming = OpenAILLMStreaming;
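In the streaming variant, `stop()` does not abort the HTTP request; it records `stopMsg`, and the read loop then feeds one final synthetic `chat.completion.chunk` carrying that text through `processChunk` before breaking, so the aggregated completion still ends cleanly. A small consumer-side sketch; everything except `stop`/`completion` is an assumption (argument values, the `declare`d shape, and the promise wrapping may differ from the real ILLM):

```ts
// Sketch of consuming the streaming handle; construction of `llm` and the
// argument values are assumed, not shown in this diff.
declare const llm: {
  getConversationResponse(
    messages: unknown[],
    tools: unknown[] | undefined,
    onMessage?: (text: string, done: boolean) => Promise<void>,
  ): Promise<{ stop: (msg?: string) => void; completion: Promise<unknown> }>;
};

async function streamWithTimeout(): Promise<unknown> {
  const { stop, completion } = await llm.getConversationResponse(
    [],
    undefined,
    async (text, done) => {
      if (!done) process.stdout.write(text); // echo fragments as they arrive
    },
  );
  // Interrupt after 5 s: the read loop appends the stop message as one
  // final synthetic chunk, then the completion resolves normally.
  setTimeout(() => stop(" AGENT INTERRUPTED"), 5000);
  return completion;
}
```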