npm - omnikey-cli - Versions diffs - 1.0.18 → 1.0.20 - Mend

omnikey-cli 1.0.18 → 1.0.20

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (5)

package/backend-dist/agent/agentPrompts.js +5 -3
package/backend-dist/agent/agentServer.js +61 -2
package/backend-dist/featureRoutes.js +2 -2
package/backend-dist/index.js +3 -3
package/package.json +1 -1

package/backend-dist/agent/agentPrompts.js CHANGED Viewed

@@ -26,14 +26,16 @@ ${hasTaskInstructions
 - If a request needs BOTH machine data AND web search: emit a \`<shell_script>\` first → wait for \`TERMINAL OUTPUT:\` → then call the web tool with concrete values. Never use placeholders like "my IP" in a web query.
 **Incoming message tags:**
-- \`TERMINAL OUTPUT:\` — stdout/stderr from a prior script. Use it to continue reasoning or emit a follow-up.
+- \`TERMINAL OUTPUT:\` — stdout/stderr from a prior script. Analyze it immediately and respond with EITHER a follow-up \`<shell_script>\` (if more data is needed) OR a \`<final_answer>\` (if you have enough to conclude). You MUST pick one — never respond with plain text.
 - \`COMMAND ERROR:\` — script failed. Diagnose and emit a corrected \`<shell_script>\` or explain in \`<final_answer>\`.
 - No prefix — direct user message; treat as the primary request.
 **Response format — every response must be exactly one of:**
-1. \`<shell_script>...</shell_script>\` — to run commands.
+1. \`<shell_script>...</shell_script>\` — to run commands and gather more data.
 2. A \`web_search\` or \`web_fetch\` tool call — to fetch web context (use native tool calling, not XML tags).
-3. \`<final_answer>...</final_answer>\` — when done.
+3. \`<final_answer>...</final_answer>\` — your conclusion once you have enough information.
+**Critical rule:** After receiving \`TERMINAL OUTPUT:\` you MUST immediately produce either \`<shell_script>\` or \`<final_answer>\`. Never output raw text, markdown, or any other format. If the terminal output contains enough information to answer the user's request, output \`<final_answer>\` right away.
 No plain text, reasoning, or other tags outside these blocks. Never wrap in additional XML/JSON.

package/backend-dist/agent/agentServer.js CHANGED Viewed

@@ -105,9 +105,27 @@ async function runToolLoop(initialResult, session, sessionId, send, log, tools,
         });
         await onUsage(result);
     }
+    // If we exhausted the iteration cap and the model still wants to call tools,
+    // force a final text response by calling again without tools.
+    if (result.finish_reason === 'tool_calls') {
+        log.warn('Tool loop hit MAX_TOOL_ITERATIONS; forcing final conclusion', { sessionId });
+        session.history.push(result.assistantMessage);
+        session.history.push({
+            role: 'user',
+            content: 'You have reached the maximum number of tool calls. Based on all the information gathered so far, provide a single, final, concise answer. Do not call any more tools.',
+        });
+        result = await ai_client_1.aiClient.complete(aiModel, session.history, {
+            tools: undefined,
+            temperature: 0.2,
+        });
+        await onUsage(result);
+    }
     log.info('Finished reasoning and tool calls: ', {
         reason: result.finish_reason,
     });
+    if (result.assistantMessage) {
+        session.history.push(result.assistantMessage);
+    }
     return result;
 }
 function buildAvailableTools() {
@@ -239,7 +257,12 @@ async function authenticateFromAuthHeader(authHeader, log) {
     }
 }
 function createUserContent(content, hasStoredPrompt) {
-    return hasStoredPrompt ? content.replace(/@omniAgent/g, '').trim() : content;
+    return hasStoredPrompt
+        ? content
+            .toLowerCase()
+            .replace(/@omniagent/g, '')
+            .trim()
+        : content;
 }
 async function runAgentTurn(sessionId, subscription, clientMessage, send, log) {
     const { sessionState: session, hasStoredPrompt } = await getOrCreateSession(sessionId, subscription, clientMessage.platform, log);
@@ -278,6 +301,10 @@ async function runAgentTurn(sessionId, subscription, clientMessage, send, log) {
     });
     const isAssistance = isTerminalOutput || isErrorFlag;
     if (!clientMessage?.is_web_call) {
+        // Terminal output and command errors are always user-role messages — they
+        // represent environment feedback that the agent must reason about next.
+        // Pushing them as 'assistant' would create two consecutive assistant turns
+        // which breaks most LLM APIs and prevents the model from processing the output.
         session.history.push({
             role: 'user',
             content: isAssistance
@@ -291,7 +318,7 @@ async function runAgentTurn(sessionId, subscription, clientMessage, send, log) {
     const tools = isFinalTurn ? undefined : buildAvailableTools();
     const recordUsage = async (result) => {
         const usage = result.usage;
-        if (!usage || !subscription.id)
+        if (!usage || !subscription.id || config_1.config.isSelfHosted)
             return;
         try {
             await subscriptionUsage_1.SubscriptionUsage.create({
@@ -352,6 +379,13 @@ async function runAgentTurn(sessionId, subscription, clientMessage, send, log) {
                 sessionMessages.delete(sessionId);
                 return;
             }
+            await runAgentTurn(sessionId, subscription, {
+                sender: 'agent',
+                session_id: sessionId,
+                content: '',
+                is_web_call: true,
+            }, send, logger_1.logger);
+            return;
         }
         // Ensure that a proper <final_answer> block is produced for the
         // desktop clients once we reach the final turn. If the model did
@@ -395,6 +429,31 @@ async function runAgentTurn(sessionId, subscription, clientMessage, send, log) {
             });
             sessionMessages.delete(sessionId);
         }
+        else if (content) {
+            // Fallback: the LLM returned content without any recognized tag and it
+            // is not the final turn (e.g. plain-text conclusion after terminal
+            // output). Treat it as a final answer so the client is never left
+            // hanging.
+            log.info('Agent returned untagged content on a non-final turn; treating as final answer', {
+                sessionId,
+                subscriptionId: subscription.id,
+                turn: session.turns,
+            });
+            session.history.push({ role: 'assistant', content });
+            send({
+                session_id: sessionId,
+                sender: 'agent',
+                content: `<final_answer>\n${content}\n</final_answer>`,
+            });
+            sessionMessages.delete(sessionId);
+        }
+        else {
+            log.warn('Agent returned empty content with no recognized tags; sending error', {
+                sessionId,
+            });
+            sendFinalAnswer(send, sessionId, 'The agent returned an empty response. Please try again.', true);
+            sessionMessages.delete(sessionId);
+        }
     }
     catch (err) {
         log.error('Agent LLM call failed', { error: err });

package/backend-dist/featureRoutes.js CHANGED Viewed

@@ -118,7 +118,7 @@ async function enhanceText(logger, text, cmd, subscription) {
         const { rawResponse, usage, model } = result;
         // Record token usage for this subscription and model, if usage
         // data is available and we know which subscription made the call.
-        if (usage && subscription.id) {
+        if (usage && subscription.id && !config_1.config.isSelfHosted) {
             try {
                 await subscriptionUsage_1.SubscriptionUsage.create({
                     subscriptionId: subscription.id,
@@ -197,7 +197,7 @@ async function streamEnhanceResponse(res, text, cmd) {
             return;
         }
         const { usage, model } = result;
-        if (usage && subscription.id) {
+        if (usage && subscription.id && !config_1.config.isSelfHosted) {
             try {
                 await subscriptionUsage_1.SubscriptionUsage.create({
                     subscriptionId: subscription.id,

package/backend-dist/index.js CHANGED Viewed

@@ -64,8 +64,8 @@ app.get('/macos/appcast', (req, res) => {
     const appcastUrl = `${baseUrl}/macos/appcast`;
     // These should match the values embedded into the macOS app
     // Info.plist in macOS/build_release_dmg.sh.
-    const bundleVersion = '14';
-    const shortVersion = '1.0.13';
+    const bundleVersion = '16';
+    const shortVersion = '1.0.15';
     const xml = `<?xml version="1.0" encoding="utf-8"?>
 <rss version="2.0"
      xmlns:sparkle="http://www.andymatuschak.org/xml-namespaces/sparkle"
@@ -93,7 +93,7 @@ app.get('/macos/appcast', (req, res) => {
 // ── Windows distribution endpoints ───────────────────────────────────────────
 // These should match the values in windows/OmniKey.Windows.csproj
 // <Version> and windows/build_release_zip.ps1 $APP_VERSION.
-const WIN_VERSION = '1.2';
+const WIN_VERSION = '1.3';
 const WIN_ZIP_FILENAME = 'OmniKeyAI-windows-win-x64.zip';
 const WIN_ZIP_PATH = path_1.default.join(process.cwd(), 'windows', WIN_ZIP_FILENAME);
 // Serves the pre-built ZIP produced by windows/build_release_zip.ps1.

package/package.json CHANGED Viewed

@@ -4,7 +4,7 @@
     "access": "public",
     "registry": "https://registry.npmjs.org/"
   },
-  "version": "1.0.18",
+  "version": "1.0.20",
   "description": "CLI for onboarding users to Omnikey AI and configuring OPENAI_API_KEY. Use Yarn for install/build.",
   "engines": {
     "node": ">=14.0.0",