@aj-archipelago/cortex 1.3.21 → 1.3.23
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +64 -0
- package/config.js +26 -1
- package/helper-apps/cortex-realtime-voice-server/src/cortex/memory.ts +2 -2
- package/helper-apps/cortex-realtime-voice-server/src/realtime/client.ts +9 -4
- package/helper-apps/cortex-realtime-voice-server/src/realtime/realtimeTypes.ts +1 -0
- package/lib/util.js +5 -25
- package/package.json +5 -2
- package/pathways/system/entity/memory/shared/sys_memory_helpers.js +228 -0
- package/pathways/system/entity/memory/sys_memory_format.js +30 -0
- package/pathways/system/entity/memory/sys_memory_manager.js +85 -27
- package/pathways/system/entity/memory/sys_memory_process.js +154 -0
- package/pathways/system/entity/memory/sys_memory_required.js +4 -2
- package/pathways/system/entity/memory/sys_memory_topic.js +22 -0
- package/pathways/system/entity/memory/sys_memory_update.js +50 -150
- package/pathways/system/entity/memory/sys_read_memory.js +67 -69
- package/pathways/system/entity/memory/sys_save_memory.js +1 -1
- package/pathways/system/entity/memory/sys_search_memory.js +1 -1
- package/pathways/system/entity/sys_entity_start.js +9 -6
- package/pathways/system/entity/sys_generator_image.js +5 -41
- package/pathways/system/entity/sys_generator_memory.js +3 -1
- package/pathways/system/entity/sys_generator_reasoning.js +1 -1
- package/pathways/system/entity/sys_router_tool.js +3 -4
- package/pathways/system/rest_streaming/sys_claude_35_sonnet.js +1 -1
- package/pathways/system/rest_streaming/sys_claude_3_haiku.js +1 -1
- package/pathways/system/rest_streaming/sys_google_gemini_chat.js +1 -1
- package/pathways/system/rest_streaming/sys_ollama_chat.js +21 -0
- package/pathways/system/rest_streaming/sys_ollama_completion.js +14 -0
- package/pathways/system/rest_streaming/sys_openai_chat_o1.js +1 -1
- package/pathways/system/rest_streaming/sys_openai_chat_o3_mini.js +1 -1
- package/pathways/transcribe_gemini.js +525 -0
- package/server/modelExecutor.js +8 -0
- package/server/pathwayResolver.js +13 -8
- package/server/plugins/claude3VertexPlugin.js +150 -18
- package/server/plugins/gemini15ChatPlugin.js +90 -1
- package/server/plugins/gemini15VisionPlugin.js +16 -3
- package/server/plugins/modelPlugin.js +12 -9
- package/server/plugins/ollamaChatPlugin.js +158 -0
- package/server/plugins/ollamaCompletionPlugin.js +147 -0
- package/server/rest.js +70 -8
- package/tests/claude3VertexToolConversion.test.js +411 -0
- package/tests/memoryfunction.test.js +560 -46
- package/tests/multimodal_conversion.test.js +169 -0
- package/tests/openai_api.test.js +332 -0
- package/tests/transcribe_gemini.test.js +217 -0
package/server/plugins/ollamaCompletionPlugin.js
ADDED
@@ -0,0 +1,147 @@
+import ModelPlugin from './modelPlugin.js';
+import logger from '../../lib/logger.js';
+import { Transform } from 'stream';
+
+class OllamaCompletionPlugin extends ModelPlugin {
+
+    getRequestParameters(text, parameters, prompt) {
+        return {
+            data: {
+                model: parameters.ollamaModel,
+                prompt: text,
+                stream: parameters.stream
+            },
+            params: {}
+        };
+    }
+
+    logRequestData(data, responseData, prompt) {
+        const { stream, prompt: promptText, model } = data;
+
+        if (promptText) {
+            logger.info(`[ollama completion request sent to model ${model}]`);
+            const { length, units } = this.getLength(promptText);
+            const preview = this.shortenContent(promptText);
+            logger.verbose(`prompt ${units}: ${length}, content: "${preview}"`);
+            logger.info(`[completion request contained ${length} ${units}]`);
+        }
+
+        if (stream) {
+            logger.info(`[response received as an SSE stream]`);
+        } else if (responseData) {
+            const responseText = this.parseResponse(responseData);
+            const { length, units } = this.getLength(responseText);
+            logger.info(`[response received containing ${length} ${units}]`);
+            logger.verbose(`${this.shortenContent(responseText)}`);
+        }
+
+        prompt &&
+            prompt.debugInfo &&
+            (prompt.debugInfo += `\n${JSON.stringify(data)}`);
+    }
+
+    parseResponse(data) {
+        // If data is not a string (e.g. streaming), return as is
+        if (typeof data !== 'string') {
+            return data;
+        }
+
+        // Split into lines and filter empty ones
+        const lines = data.split('\n').filter(line => line.trim());
+
+        let fullResponse = '';
+
+        for (const line of lines) {
+            try {
+                const jsonObj = JSON.parse(line);
+
+                if (jsonObj.response) {
+                    // Unescape special sequences
+                    const content = jsonObj.response
+                        .replace(/\\n/g, '\n')
+                        .replace(/\\"/g, '"')
+                        .replace(/\\\\/g, '\\')
+                        .replace(/\\u003c/g, '<')
+                        .replace(/\\u003e/g, '>');
+
+                    fullResponse += content;
+                }
+            } catch (err) {
+                // If we can't parse the line as JSON, just skip it
+                continue;
+            }
+        }
+
+        return fullResponse;
+    }
+
+    processStreamEvent(event, requestProgress) {
+        try {
+            const data = JSON.parse(event.data);
+
+            // Handle the streaming response
+            if (data.response) {
+                // Unescape special sequences in the content
+                const content = data.response
+                    .replace(/\\n/g, '\n')
+                    .replace(/\\"/g, '"')
+                    .replace(/\\\\/g, '\\')
+                    .replace(/\\u003c/g, '<')
+                    .replace(/\\u003e/g, '>');
+
+                requestProgress.data = JSON.stringify(content);
+            }
+
+            // Check if this is the final message
+            if (data.done) {
+                requestProgress.data = '[DONE]';
+                requestProgress.progress = 1;
+            }
+
+            return requestProgress;
+        } catch (err) {
+            // If we can't parse the event data, return the progress as is
+            return requestProgress;
+        }
+    }
+
+    async execute(text, parameters, prompt, cortexRequest) {
+        const requestParameters = this.getRequestParameters(text, parameters, prompt);
+        cortexRequest.data = { ...(cortexRequest.data || {}), ...requestParameters.data };
+        cortexRequest.params = { ...(cortexRequest.params || {}), ...requestParameters.params };
+
+        // For Ollama streaming, transform NDJSON to SSE format
+        if (parameters.stream) {
+            const response = await this.executeRequest(cortexRequest);
+
+            // Create a transform stream that converts NDJSON to SSE format
+            const transformer = new Transform({
+                decodeStrings: false, // Keep as string
+                transform(chunk, encoding, callback) {
+                    try {
+                        const lines = chunk.toString().split('\n');
+                        for (const line of lines) {
+                            if (line.trim()) {
+                                // Format as SSE data
+                                this.push(`data: ${line}\n\n`);
+                            }
+                        }
+                        callback();
+                    } catch (err) {
+                        callback(err);
+                    }
+                }
+            });
+
+            // Pipe the response through our transformer
+            response.pipe(transformer);
+
+            // Return the transformed stream
+            return transformer;
+        }
+
+        return this.executeRequest(cortexRequest);
+    }
+}
+
+export default OllamaCompletionPlugin;
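For context, the plugin's central trick is re-packaging Ollama's newline-delimited JSON (one JSON object per line) as SSE `data:` events so Cortex's existing streaming machinery can consume it. A standalone sketch of that mapping, not part of the package, with hypothetical sample chunks:

```js
// Standalone sketch (not from the package): how the NDJSON -> SSE mapping behaves.
// The chunk payloads below are hypothetical Ollama generate-style responses.
const ndjsonChunk = [
  '{"model":"llama3","response":"Hel","done":false}',
  '{"model":"llama3","response":"lo","done":false}',
  '{"model":"llama3","response":"","done":true}'
].join('\n');

// Same per-line treatment as the Transform stream in execute() above:
// every non-empty NDJSON line becomes one SSE "data:" event.
const sseEvents = ndjsonChunk
  .split('\n')
  .filter(line => line.trim())
  .map(line => `data: ${line}\n\n`)
  .join('');

console.log(sseEvents);
// data: {"model":"llama3","response":"Hel","done":false}
// data: {"model":"llama3","response":"lo","done":false}
// data: {"model":"llama3","response":"","done":true}
```

`processStreamEvent` then picks `response` out of each event and flips `progress` to 1 when a `done` chunk arrives.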
package/server/rest.js
CHANGED
@@ -6,6 +6,22 @@ import { requestState } from './requestState.js';
 import { v4 as uuidv4 } from 'uuid';
 import logger from '../lib/logger.js';
 import { getSingleTokenChunks } from './chunker.js';
+import axios from 'axios';
+
+const getOllamaModels = async (ollamaUrl) => {
+    try {
+        const response = await axios.get(`${ollamaUrl}/api/tags`);
+        return response.data.models.map(model => ({
+            id: `ollama-${model.name}`,
+            object: 'model',
+            owned_by: 'ollama',
+            permission: ''
+        }));
+    } catch (error) {
+        logger.error(`Error fetching Ollama models: ${error.message}`);
+        return [];
+    }
+};
 
 const chunkTextIntoTokens = (() => {
     let partialToken = '';
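`getOllamaModels` leans on Ollama's tags endpoint; the response shape assumed here is the `{ models: [{ name, ... }] }` form that the code above reads, and the sample names below are hypothetical. A sketch of the projection it applies:

```js
// Hypothetical /api/tags payload (real responses carry more fields per model).
const tagsResponse = {
  models: [
    { name: 'llama3.2:latest' },
    { name: 'mistral:7b' }
  ]
};

// The same projection getOllamaModels performs on response.data.models:
const ollamaModels = tagsResponse.models.map(model => ({
  id: `ollama-${model.name}`, // e.g. "ollama-llama3.2:latest"
  object: 'model',
  owned_by: 'ollama',
  permission: ''
}));
```

The `ollama-` prefix on the id is what the completion and chat endpoints below key off to select the Ollama pathways.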
@@ -28,6 +44,13 @@ const processRestRequest = async (server, req, pathway, name, parameterMap = {})
             return Boolean(value);
         } else if (type === 'Int') {
             return parseInt(value, 10);
+        } else if (type === '[MultiMessage]' && Array.isArray(value)) {
+            return value.map(msg => ({
+                ...msg,
+                content: Array.isArray(msg.content) ?
+                    JSON.stringify(msg.content) :
+                    msg.content
+            }));
         } else {
             return value;
         }
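The new `[MultiMessage]` branch keeps OpenAI-style multimodal messages intact on their way into the GraphQL variables: array-valued `content` is serialized to a JSON string, while plain string content passes through. A small sketch with a hypothetical message:

```js
// Hypothetical OpenAI-style chat message whose content is an array of parts.
const value = [{
  role: 'user',
  content: [
    { type: 'text', text: 'What is in this image?' },
    { type: 'image_url', image_url: { url: 'https://example.com/cat.png' } }
  ]
}];

// Same conversion as the [MultiMessage] branch above:
const converted = value.map(msg => ({
  ...msg,
  content: Array.isArray(msg.content) ? JSON.stringify(msg.content) : msg.content
}));
// converted[0].content is now a JSON string; string-valued content is unchanged.
```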
@@ -58,8 +81,16 @@ const processRestRequest = async (server, req, pathway, name, parameterMap = {})
     `;
 
     const result = await server.executeOperation({ query, variables });
-    const resultText = result?.body?.singleResult?.data?.[name]?.result || result?.body?.singleResult?.errors?.[0]?.message || "";
 
+    // if we're streaming and there are errors, we return a standard error code
+    if (Boolean(req.body.stream)) {
+        if (result?.body?.singleResult?.errors) {
+            return `[ERROR] ${result.body.singleResult.errors[0].message.split(';')[0]}`;
+        }
+    }
+
+    // otherwise errors can just be returned as a string
+    const resultText = result?.body?.singleResult?.data?.[name]?.result || result?.body?.singleResult?.errors?.[0]?.message || "";
     return resultText;
 };
 
@@ -86,7 +117,6 @@ const processIncomingStream = (requestId, res, jsonResponse, pathway) => {
 
         // If we haven't sent the stop message yet, do it now
         if (jsonResponse.choices?.[0]?.finish_reason !== "stop") {
-
            let jsonEndStream = JSON.parse(JSON.stringify(jsonResponse));
 
            if (jsonEndStream.object === 'text_completion') {
@@ -116,7 +146,6 @@ const processIncomingStream = (requestId, res, jsonResponse, pathway) => {
    }
 
    const fillJsonResponse = (jsonResponse, inputText, _finishReason) => {
-
        jsonResponse.choices[0].finish_reason = null;
        if (jsonResponse.object === 'text_completion') {
            jsonResponse.choices[0].text = inputText;
@@ -129,6 +158,14 @@ const processIncomingStream = (requestId, res, jsonResponse, pathway) => {
 
    startStream(res);
 
+    // If the requestId is an error message, we can't continue
+    if (requestId.startsWith('[ERROR]')) {
+        fillJsonResponse(jsonResponse, requestId, "stop");
+        sendStreamData(jsonResponse);
+        finishStream(res, jsonResponse);
+        return;
+    }
+
    let subscription;
 
    subscription = pubsub.subscribe('REQUEST_PROGRESS', (data) => {
@@ -261,7 +298,14 @@ function buildRestEndpoints(pathways, app, server, config) {
     // Create OpenAI compatible endpoints
     app.post('/v1/completions', async (req, res) => {
         const modelName = req.body.model || 'gpt-3.5-turbo';
-
+        let pathwayName;
+
+        if (modelName.startsWith('ollama-')) {
+            pathwayName = 'sys_ollama_completion';
+            req.body.ollamaModel = modelName.replace('ollama-', '');
+        } else {
+            pathwayName = openAICompletionModels[modelName] || openAICompletionModels['*'];
+        }
 
         if (!pathwayName) {
             res.status(404).json({
@@ -297,7 +341,6 @@ function buildRestEndpoints(pathways, app, server, config) {
         if (Boolean(req.body.stream)) {
             jsonResponse.id = `cmpl-${resultText}`;
             jsonResponse.choices[0].finish_reason = null;
-            //jsonResponse.object = "text_completion.chunk";
 
             processIncomingStream(resultText, res, jsonResponse, pathway);
         } else {
@@ -309,7 +352,14 @@ function buildRestEndpoints(pathways, app, server, config) {
 
     app.post('/v1/chat/completions', async (req, res) => {
         const modelName = req.body.model || 'gpt-3.5-turbo';
-
+        let pathwayName;
+
+        if (modelName.startsWith('ollama-')) {
+            pathwayName = 'sys_ollama_chat';
+            req.body.ollamaModel = modelName.replace('ollama-', '');
+        } else {
+            pathwayName = openAIChatModels[modelName] || openAIChatModels['*'];
+        }
 
         if (!pathwayName) {
             res.status(404).json({
@@ -364,8 +414,11 @@ function buildRestEndpoints(pathways, app, server, config) {
     app.get('/v1/models', async (req, res) => {
         const openAIModels = { ...openAIChatModels, ...openAICompletionModels };
         const defaultModelId = 'gpt-3.5-turbo';
+        let models = [];
 
-
+        // Get standard OpenAI-compatible models, filtering out our internal pathway models
+        models = Object.entries(openAIModels)
+            .filter(([modelId]) => !['ollama-chat', 'ollama-completion'].includes(modelId))
             .map(([modelId]) => {
                 if (modelId.includes('*')) {
                     modelId = defaultModelId;
@@ -376,7 +429,16 @@ function buildRestEndpoints(pathways, app, server, config) {
                     owned_by: 'openai',
                     permission: '',
                 };
-            })
+            });
+
+        // Get Ollama models if configured
+        if (config.get('ollamaUrl')) {
+            const ollamaModels = await getOllamaModels(config.get('ollamaUrl'));
+            models = [...models, ...ollamaModels];
+        }
+
+        // Filter out duplicates and sort
+        models = models
             .filter((model, index, self) => {
                 return index === self.findIndex((m) => m.id === model.id);
             })